{ "best_metric": 0.9214921903908192, "best_model_checkpoint": "./models/bart-base-spelling-nl-1m-3/checkpoint-177000", "epoch": 1.999985135567007, "global_step": 185004, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.0002999837841343971, "loss": 1.0202, "step": 10 }, { "epoch": 0.0, "learning_rate": 0.00029996756826879416, "loss": 0.2241, "step": 20 }, { "epoch": 0.0, "learning_rate": 0.0002999513524031912, "loss": 0.175, "step": 30 }, { "epoch": 0.0, "learning_rate": 0.00029993513653758834, "loss": 0.1532, "step": 40 }, { "epoch": 0.0, "learning_rate": 0.00029991892067198546, "loss": 0.1924, "step": 50 }, { "epoch": 0.0, "learning_rate": 0.00029990270480638253, "loss": 0.146, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.00029988648894077965, "loss": 0.1704, "step": 70 }, { "epoch": 0.0, "learning_rate": 0.0002998702730751767, "loss": 0.157, "step": 80 }, { "epoch": 0.0, "learning_rate": 0.00029985405720957384, "loss": 0.1478, "step": 90 }, { "epoch": 0.0, "learning_rate": 0.00029983784134397096, "loss": 0.1327, "step": 100 }, { "epoch": 0.0, "learning_rate": 0.000299821625478368, "loss": 0.1403, "step": 110 }, { "epoch": 0.0, "learning_rate": 0.0002998054096127651, "loss": 0.1263, "step": 120 }, { "epoch": 0.0, "learning_rate": 0.0002997891937471622, "loss": 0.1305, "step": 130 }, { "epoch": 0.0, "learning_rate": 0.0002997729778815593, "loss": 0.1128, "step": 140 }, { "epoch": 0.0, "learning_rate": 0.0002997567620159564, "loss": 0.1263, "step": 150 }, { "epoch": 0.0, "learning_rate": 0.00029974054615035346, "loss": 0.1136, "step": 160 }, { "epoch": 0.0, "learning_rate": 0.0002997243302847506, "loss": 0.1132, "step": 170 }, { "epoch": 0.0, "learning_rate": 0.0002997081144191477, "loss": 0.1185, "step": 180 }, { "epoch": 0.0, "learning_rate": 0.00029969189855354476, "loss": 0.1145, "step": 190 }, { "epoch": 0.0, "learning_rate": 0.00029967568268794183, "loss": 0.1166, "step": 200 }, { "epoch": 0.0, "learning_rate": 0.00029965946682233895, "loss": 0.1197, "step": 210 }, { "epoch": 0.0, "learning_rate": 0.00029964325095673607, "loss": 0.1119, "step": 220 }, { "epoch": 0.0, "learning_rate": 0.00029962703509113313, "loss": 0.1056, "step": 230 }, { "epoch": 0.0, "learning_rate": 0.00029961081922553025, "loss": 0.1087, "step": 240 }, { "epoch": 0.0, "learning_rate": 0.0002995946033599273, "loss": 0.109, "step": 250 }, { "epoch": 0.0, "learning_rate": 0.00029957838749432444, "loss": 0.0968, "step": 260 }, { "epoch": 0.0, "learning_rate": 0.0002995621716287215, "loss": 0.1025, "step": 270 }, { "epoch": 0.0, "learning_rate": 0.0002995459557631186, "loss": 0.0981, "step": 280 }, { "epoch": 0.0, "learning_rate": 0.0002995297398975157, "loss": 0.1009, "step": 290 }, { "epoch": 0.0, "learning_rate": 0.0002995135240319128, "loss": 0.1017, "step": 300 }, { "epoch": 0.0, "learning_rate": 0.0002994973081663099, "loss": 0.1169, "step": 310 }, { "epoch": 0.0, "learning_rate": 0.000299481092300707, "loss": 0.1023, "step": 320 }, { "epoch": 0.0, "learning_rate": 0.00029946487643510406, "loss": 0.1122, "step": 330 }, { "epoch": 0.0, "learning_rate": 0.0002994486605695012, "loss": 0.0944, "step": 340 }, { "epoch": 0.0, "learning_rate": 0.00029943244470389825, "loss": 0.0995, "step": 350 }, { "epoch": 0.0, "learning_rate": 0.00029941622883829537, "loss": 0.0897, "step": 360 }, { "epoch": 0.0, "learning_rate": 0.0002994000129726925, "loss": 0.0936, "step": 370 }, { "epoch": 0.0, "learning_rate": 0.00029938379710708955, "loss": 0.0905, "step": 380 }, { "epoch": 0.0, "learning_rate": 0.0002993675812414866, "loss": 0.0891, "step": 390 }, { "epoch": 0.0, "learning_rate": 0.00029935136537588374, "loss": 0.0886, "step": 400 }, { "epoch": 0.0, "learning_rate": 0.00029933514951028086, "loss": 0.0872, "step": 410 }, { "epoch": 0.0, "learning_rate": 0.0002993189336446779, "loss": 0.0874, "step": 420 }, { "epoch": 0.0, "learning_rate": 0.000299302717779075, "loss": 0.0945, "step": 430 }, { "epoch": 0.0, "learning_rate": 0.0002992865019134721, "loss": 0.1135, "step": 440 }, { "epoch": 0.0, "learning_rate": 0.00029927028604786923, "loss": 0.1259, "step": 450 }, { "epoch": 0.0, "learning_rate": 0.0002992540701822663, "loss": 0.1149, "step": 460 }, { "epoch": 0.01, "learning_rate": 0.00029923785431666336, "loss": 0.1007, "step": 470 }, { "epoch": 0.01, "learning_rate": 0.0002992216384510605, "loss": 0.1059, "step": 480 }, { "epoch": 0.01, "learning_rate": 0.0002992054225854576, "loss": 0.1042, "step": 490 }, { "epoch": 0.01, "learning_rate": 0.00029918920671985467, "loss": 0.1074, "step": 500 }, { "epoch": 0.01, "learning_rate": 0.0002991729908542518, "loss": 0.093, "step": 510 }, { "epoch": 0.01, "learning_rate": 0.00029915677498864885, "loss": 0.1079, "step": 520 }, { "epoch": 0.01, "learning_rate": 0.00029914055912304597, "loss": 0.0862, "step": 530 }, { "epoch": 0.01, "learning_rate": 0.0002991243432574431, "loss": 0.0947, "step": 540 }, { "epoch": 0.01, "learning_rate": 0.00029910812739184016, "loss": 0.0835, "step": 550 }, { "epoch": 0.01, "learning_rate": 0.0002990919115262372, "loss": 0.0931, "step": 560 }, { "epoch": 0.01, "learning_rate": 0.00029907569566063434, "loss": 0.0853, "step": 570 }, { "epoch": 0.01, "learning_rate": 0.00029905947979503146, "loss": 0.0821, "step": 580 }, { "epoch": 0.01, "learning_rate": 0.0002990432639294285, "loss": 0.0911, "step": 590 }, { "epoch": 0.01, "learning_rate": 0.0002990270480638256, "loss": 0.0821, "step": 600 }, { "epoch": 0.01, "learning_rate": 0.0002990108321982227, "loss": 0.0909, "step": 610 }, { "epoch": 0.01, "learning_rate": 0.00029899461633261983, "loss": 0.0887, "step": 620 }, { "epoch": 0.01, "learning_rate": 0.0002989784004670169, "loss": 0.0853, "step": 630 }, { "epoch": 0.01, "learning_rate": 0.00029896218460141396, "loss": 0.0791, "step": 640 }, { "epoch": 0.01, "learning_rate": 0.0002989459687358111, "loss": 0.0788, "step": 650 }, { "epoch": 0.01, "learning_rate": 0.0002989297528702082, "loss": 0.0836, "step": 660 }, { "epoch": 0.01, "learning_rate": 0.00029891353700460527, "loss": 0.081, "step": 670 }, { "epoch": 0.01, "learning_rate": 0.0002988973211390024, "loss": 0.0799, "step": 680 }, { "epoch": 0.01, "learning_rate": 0.00029888110527339945, "loss": 0.0832, "step": 690 }, { "epoch": 0.01, "learning_rate": 0.0002988648894077966, "loss": 0.0746, "step": 700 }, { "epoch": 0.01, "learning_rate": 0.00029884867354219364, "loss": 0.0846, "step": 710 }, { "epoch": 0.01, "learning_rate": 0.00029883245767659076, "loss": 0.084, "step": 720 }, { "epoch": 0.01, "learning_rate": 0.0002988162418109878, "loss": 0.0793, "step": 730 }, { "epoch": 0.01, "learning_rate": 0.00029880002594538495, "loss": 0.0761, "step": 740 }, { "epoch": 0.01, "learning_rate": 0.00029878381007978207, "loss": 0.0768, "step": 750 }, { "epoch": 0.01, "learning_rate": 0.00029876759421417913, "loss": 0.0829, "step": 760 }, { "epoch": 0.01, "learning_rate": 0.0002987513783485762, "loss": 0.0768, "step": 770 }, { "epoch": 0.01, "learning_rate": 0.0002987351624829733, "loss": 0.0708, "step": 780 }, { "epoch": 0.01, "learning_rate": 0.00029871894661737044, "loss": 0.0757, "step": 790 }, { "epoch": 0.01, "learning_rate": 0.0002987027307517675, "loss": 0.0762, "step": 800 }, { "epoch": 0.01, "learning_rate": 0.0002986865148861646, "loss": 0.0788, "step": 810 }, { "epoch": 0.01, "learning_rate": 0.0002986702990205617, "loss": 0.0722, "step": 820 }, { "epoch": 0.01, "learning_rate": 0.0002986540831549588, "loss": 0.0891, "step": 830 }, { "epoch": 0.01, "learning_rate": 0.00029863786728935587, "loss": 0.0776, "step": 840 }, { "epoch": 0.01, "learning_rate": 0.000298621651423753, "loss": 0.0764, "step": 850 }, { "epoch": 0.01, "learning_rate": 0.00029860543555815006, "loss": 0.0751, "step": 860 }, { "epoch": 0.01, "learning_rate": 0.0002985892196925472, "loss": 0.0762, "step": 870 }, { "epoch": 0.01, "learning_rate": 0.00029857300382694424, "loss": 0.0757, "step": 880 }, { "epoch": 0.01, "learning_rate": 0.00029855678796134136, "loss": 0.0718, "step": 890 }, { "epoch": 0.01, "learning_rate": 0.00029854057209573843, "loss": 0.0736, "step": 900 }, { "epoch": 0.01, "learning_rate": 0.00029852435623013555, "loss": 0.078, "step": 910 }, { "epoch": 0.01, "learning_rate": 0.0002985081403645326, "loss": 0.0774, "step": 920 }, { "epoch": 0.01, "learning_rate": 0.00029849192449892973, "loss": 0.0727, "step": 930 }, { "epoch": 0.01, "learning_rate": 0.0002984757086333268, "loss": 0.0834, "step": 940 }, { "epoch": 0.01, "learning_rate": 0.0002984594927677239, "loss": 0.0811, "step": 950 }, { "epoch": 0.01, "learning_rate": 0.000298443276902121, "loss": 0.0768, "step": 960 }, { "epoch": 0.01, "learning_rate": 0.0002984270610365181, "loss": 0.0764, "step": 970 }, { "epoch": 0.01, "learning_rate": 0.0002984108451709152, "loss": 0.0817, "step": 980 }, { "epoch": 0.01, "learning_rate": 0.0002983946293053123, "loss": 0.0856, "step": 990 }, { "epoch": 0.01, "learning_rate": 0.00029837841343970936, "loss": 0.0834, "step": 1000 }, { "epoch": 0.01, "eval_cer": 0.9216337726727086, "eval_loss": 0.060326751321554184, "eval_runtime": 121.7661, "eval_samples_per_second": 16.425, "eval_steps_per_second": 4.106, "step": 1000 }, { "epoch": 0.01, "learning_rate": 0.0002983621975741065, "loss": 0.0711, "step": 1010 }, { "epoch": 0.01, "learning_rate": 0.0002983459817085036, "loss": 0.0706, "step": 1020 }, { "epoch": 0.01, "learning_rate": 0.00029832976584290066, "loss": 0.0661, "step": 1030 }, { "epoch": 0.01, "learning_rate": 0.00029831354997729773, "loss": 0.0843, "step": 1040 }, { "epoch": 0.01, "learning_rate": 0.00029829733411169485, "loss": 0.0696, "step": 1050 }, { "epoch": 0.01, "learning_rate": 0.00029828111824609197, "loss": 0.0796, "step": 1060 }, { "epoch": 0.01, "learning_rate": 0.00029826490238048903, "loss": 0.0737, "step": 1070 }, { "epoch": 0.01, "learning_rate": 0.00029824868651488615, "loss": 0.073, "step": 1080 }, { "epoch": 0.01, "learning_rate": 0.0002982324706492832, "loss": 0.0668, "step": 1090 }, { "epoch": 0.01, "learning_rate": 0.00029821625478368034, "loss": 0.076, "step": 1100 }, { "epoch": 0.01, "learning_rate": 0.00029820003891807746, "loss": 0.0771, "step": 1110 }, { "epoch": 0.01, "learning_rate": 0.0002981838230524745, "loss": 0.0652, "step": 1120 }, { "epoch": 0.01, "learning_rate": 0.0002981676071868716, "loss": 0.0713, "step": 1130 }, { "epoch": 0.01, "learning_rate": 0.0002981513913212687, "loss": 0.0709, "step": 1140 }, { "epoch": 0.01, "learning_rate": 0.00029813517545566583, "loss": 0.0741, "step": 1150 }, { "epoch": 0.01, "learning_rate": 0.0002981189595900629, "loss": 0.073, "step": 1160 }, { "epoch": 0.01, "learning_rate": 0.00029810274372445996, "loss": 0.063, "step": 1170 }, { "epoch": 0.01, "learning_rate": 0.0002980865278588571, "loss": 0.0682, "step": 1180 }, { "epoch": 0.01, "learning_rate": 0.0002980703119932542, "loss": 0.0699, "step": 1190 }, { "epoch": 0.01, "learning_rate": 0.00029805409612765127, "loss": 0.0667, "step": 1200 }, { "epoch": 0.01, "learning_rate": 0.00029803788026204833, "loss": 0.0717, "step": 1210 }, { "epoch": 0.01, "learning_rate": 0.00029802166439644545, "loss": 0.0657, "step": 1220 }, { "epoch": 0.01, "learning_rate": 0.00029800544853084257, "loss": 0.0761, "step": 1230 }, { "epoch": 0.01, "learning_rate": 0.00029798923266523964, "loss": 0.0801, "step": 1240 }, { "epoch": 0.01, "learning_rate": 0.00029797301679963676, "loss": 0.0712, "step": 1250 }, { "epoch": 0.01, "learning_rate": 0.0002979568009340338, "loss": 0.068, "step": 1260 }, { "epoch": 0.01, "learning_rate": 0.00029794058506843094, "loss": 0.0628, "step": 1270 }, { "epoch": 0.01, "learning_rate": 0.000297924369202828, "loss": 0.0705, "step": 1280 }, { "epoch": 0.01, "learning_rate": 0.00029790815333722513, "loss": 0.0692, "step": 1290 }, { "epoch": 0.01, "learning_rate": 0.0002978919374716222, "loss": 0.0786, "step": 1300 }, { "epoch": 0.01, "learning_rate": 0.0002978757216060193, "loss": 0.0775, "step": 1310 }, { "epoch": 0.01, "learning_rate": 0.0002978595057404164, "loss": 0.0664, "step": 1320 }, { "epoch": 0.01, "learning_rate": 0.0002978432898748135, "loss": 0.0603, "step": 1330 }, { "epoch": 0.01, "learning_rate": 0.00029782707400921056, "loss": 0.0608, "step": 1340 }, { "epoch": 0.01, "learning_rate": 0.0002978108581436077, "loss": 0.0627, "step": 1350 }, { "epoch": 0.01, "learning_rate": 0.00029779464227800475, "loss": 0.0677, "step": 1360 }, { "epoch": 0.01, "learning_rate": 0.00029777842641240187, "loss": 0.0728, "step": 1370 }, { "epoch": 0.01, "learning_rate": 0.000297762210546799, "loss": 0.0751, "step": 1380 }, { "epoch": 0.02, "learning_rate": 0.00029774599468119605, "loss": 0.0666, "step": 1390 }, { "epoch": 0.02, "learning_rate": 0.0002977297788155931, "loss": 0.0664, "step": 1400 }, { "epoch": 0.02, "learning_rate": 0.00029771356294999024, "loss": 0.0645, "step": 1410 }, { "epoch": 0.02, "learning_rate": 0.00029769734708438736, "loss": 0.0714, "step": 1420 }, { "epoch": 0.02, "learning_rate": 0.0002976811312187844, "loss": 0.0743, "step": 1430 }, { "epoch": 0.02, "learning_rate": 0.00029766491535318155, "loss": 0.0631, "step": 1440 }, { "epoch": 0.02, "learning_rate": 0.0002976486994875786, "loss": 0.0612, "step": 1450 }, { "epoch": 0.02, "learning_rate": 0.00029763248362197573, "loss": 0.0598, "step": 1460 }, { "epoch": 0.02, "learning_rate": 0.0002976162677563728, "loss": 0.058, "step": 1470 }, { "epoch": 0.02, "learning_rate": 0.0002976000518907699, "loss": 0.064, "step": 1480 }, { "epoch": 0.02, "learning_rate": 0.000297583836025167, "loss": 0.0575, "step": 1490 }, { "epoch": 0.02, "learning_rate": 0.0002975676201595641, "loss": 0.0634, "step": 1500 }, { "epoch": 0.02, "learning_rate": 0.00029755140429396117, "loss": 0.06, "step": 1510 }, { "epoch": 0.02, "learning_rate": 0.0002975351884283583, "loss": 0.0562, "step": 1520 }, { "epoch": 0.02, "learning_rate": 0.00029751897256275535, "loss": 0.0716, "step": 1530 }, { "epoch": 0.02, "learning_rate": 0.0002975027566971525, "loss": 0.0696, "step": 1540 }, { "epoch": 0.02, "learning_rate": 0.0002974865408315496, "loss": 0.0671, "step": 1550 }, { "epoch": 0.02, "learning_rate": 0.00029747032496594666, "loss": 0.0796, "step": 1560 }, { "epoch": 0.02, "learning_rate": 0.0002974541091003437, "loss": 0.0591, "step": 1570 }, { "epoch": 0.02, "learning_rate": 0.00029743789323474084, "loss": 0.0684, "step": 1580 }, { "epoch": 0.02, "learning_rate": 0.00029742167736913796, "loss": 0.0634, "step": 1590 }, { "epoch": 0.02, "learning_rate": 0.00029740546150353503, "loss": 0.0703, "step": 1600 }, { "epoch": 0.02, "learning_rate": 0.0002973892456379321, "loss": 0.0554, "step": 1610 }, { "epoch": 0.02, "learning_rate": 0.0002973730297723292, "loss": 0.0745, "step": 1620 }, { "epoch": 0.02, "learning_rate": 0.00029735681390672633, "loss": 0.0601, "step": 1630 }, { "epoch": 0.02, "learning_rate": 0.0002973405980411234, "loss": 0.0676, "step": 1640 }, { "epoch": 0.02, "learning_rate": 0.00029732438217552047, "loss": 0.0643, "step": 1650 }, { "epoch": 0.02, "learning_rate": 0.0002973081663099176, "loss": 0.0646, "step": 1660 }, { "epoch": 0.02, "learning_rate": 0.0002972919504443147, "loss": 0.0567, "step": 1670 }, { "epoch": 0.02, "learning_rate": 0.0002972757345787118, "loss": 0.0657, "step": 1680 }, { "epoch": 0.02, "learning_rate": 0.0002972595187131089, "loss": 0.0624, "step": 1690 }, { "epoch": 0.02, "learning_rate": 0.00029724330284750596, "loss": 0.0657, "step": 1700 }, { "epoch": 0.02, "learning_rate": 0.0002972270869819031, "loss": 0.0537, "step": 1710 }, { "epoch": 0.02, "learning_rate": 0.0002972108711163002, "loss": 0.0571, "step": 1720 }, { "epoch": 0.02, "learning_rate": 0.00029719465525069726, "loss": 0.0607, "step": 1730 }, { "epoch": 0.02, "learning_rate": 0.00029717843938509433, "loss": 0.0585, "step": 1740 }, { "epoch": 0.02, "learning_rate": 0.00029716222351949145, "loss": 0.0573, "step": 1750 }, { "epoch": 0.02, "learning_rate": 0.00029714600765388857, "loss": 0.0684, "step": 1760 }, { "epoch": 0.02, "learning_rate": 0.00029712979178828563, "loss": 0.0589, "step": 1770 }, { "epoch": 0.02, "learning_rate": 0.0002971135759226827, "loss": 0.0581, "step": 1780 }, { "epoch": 0.02, "learning_rate": 0.0002970973600570798, "loss": 0.0578, "step": 1790 }, { "epoch": 0.02, "learning_rate": 0.00029708114419147694, "loss": 0.0646, "step": 1800 }, { "epoch": 0.02, "learning_rate": 0.000297064928325874, "loss": 0.0542, "step": 1810 }, { "epoch": 0.02, "learning_rate": 0.0002970487124602711, "loss": 0.0683, "step": 1820 }, { "epoch": 0.02, "learning_rate": 0.0002970324965946682, "loss": 0.0626, "step": 1830 }, { "epoch": 0.02, "learning_rate": 0.0002970162807290653, "loss": 0.0561, "step": 1840 }, { "epoch": 0.02, "learning_rate": 0.0002970000648634624, "loss": 0.0681, "step": 1850 }, { "epoch": 0.02, "learning_rate": 0.0002969838489978595, "loss": 0.0608, "step": 1860 }, { "epoch": 0.02, "learning_rate": 0.00029696763313225656, "loss": 0.057, "step": 1870 }, { "epoch": 0.02, "learning_rate": 0.0002969514172666537, "loss": 0.0527, "step": 1880 }, { "epoch": 0.02, "learning_rate": 0.00029693520140105075, "loss": 0.0584, "step": 1890 }, { "epoch": 0.02, "learning_rate": 0.00029691898553544787, "loss": 0.0569, "step": 1900 }, { "epoch": 0.02, "learning_rate": 0.00029690276966984493, "loss": 0.0585, "step": 1910 }, { "epoch": 0.02, "learning_rate": 0.00029688655380424205, "loss": 0.0538, "step": 1920 }, { "epoch": 0.02, "learning_rate": 0.0002968703379386391, "loss": 0.0621, "step": 1930 }, { "epoch": 0.02, "learning_rate": 0.00029685412207303624, "loss": 0.0637, "step": 1940 }, { "epoch": 0.02, "learning_rate": 0.0002968379062074333, "loss": 0.0613, "step": 1950 }, { "epoch": 0.02, "learning_rate": 0.0002968216903418304, "loss": 0.0589, "step": 1960 }, { "epoch": 0.02, "learning_rate": 0.0002968054744762275, "loss": 0.0596, "step": 1970 }, { "epoch": 0.02, "learning_rate": 0.0002967892586106246, "loss": 0.0617, "step": 1980 }, { "epoch": 0.02, "learning_rate": 0.00029677304274502173, "loss": 0.0621, "step": 1990 }, { "epoch": 0.02, "learning_rate": 0.0002967568268794188, "loss": 0.0566, "step": 2000 }, { "epoch": 0.02, "eval_cer": 0.9216580935554872, "eval_loss": 0.04665278643369675, "eval_runtime": 120.2206, "eval_samples_per_second": 16.636, "eval_steps_per_second": 4.159, "step": 2000 }, { "epoch": 0.02, "learning_rate": 0.00029674061101381586, "loss": 0.0507, "step": 2010 }, { "epoch": 0.02, "learning_rate": 0.000296724395148213, "loss": 0.0582, "step": 2020 }, { "epoch": 0.02, "learning_rate": 0.0002967081792826101, "loss": 0.0521, "step": 2030 }, { "epoch": 0.02, "learning_rate": 0.00029669196341700716, "loss": 0.052, "step": 2040 }, { "epoch": 0.02, "learning_rate": 0.00029667574755140423, "loss": 0.0567, "step": 2050 }, { "epoch": 0.02, "learning_rate": 0.00029665953168580135, "loss": 0.0617, "step": 2060 }, { "epoch": 0.02, "learning_rate": 0.00029664331582019847, "loss": 0.055, "step": 2070 }, { "epoch": 0.02, "learning_rate": 0.00029662709995459554, "loss": 0.0628, "step": 2080 }, { "epoch": 0.02, "learning_rate": 0.00029661088408899266, "loss": 0.0618, "step": 2090 }, { "epoch": 0.02, "learning_rate": 0.0002965946682233897, "loss": 0.0605, "step": 2100 }, { "epoch": 0.02, "learning_rate": 0.00029657845235778684, "loss": 0.0616, "step": 2110 }, { "epoch": 0.02, "learning_rate": 0.00029656223649218396, "loss": 0.0598, "step": 2120 }, { "epoch": 0.02, "learning_rate": 0.000296546020626581, "loss": 0.0571, "step": 2130 }, { "epoch": 0.02, "learning_rate": 0.0002965298047609781, "loss": 0.057, "step": 2140 }, { "epoch": 0.02, "learning_rate": 0.0002965135888953752, "loss": 0.0558, "step": 2150 }, { "epoch": 0.02, "learning_rate": 0.00029649737302977233, "loss": 0.0622, "step": 2160 }, { "epoch": 0.02, "learning_rate": 0.0002964811571641694, "loss": 0.0626, "step": 2170 }, { "epoch": 0.02, "learning_rate": 0.00029646494129856646, "loss": 0.0616, "step": 2180 }, { "epoch": 0.02, "learning_rate": 0.0002964487254329636, "loss": 0.0608, "step": 2190 }, { "epoch": 0.02, "learning_rate": 0.0002964325095673607, "loss": 0.0878, "step": 2200 }, { "epoch": 0.02, "learning_rate": 0.00029641629370175777, "loss": 0.0637, "step": 2210 }, { "epoch": 0.02, "learning_rate": 0.00029640007783615483, "loss": 0.0616, "step": 2220 }, { "epoch": 0.02, "learning_rate": 0.00029638386197055195, "loss": 0.0678, "step": 2230 }, { "epoch": 0.02, "learning_rate": 0.0002963676461049491, "loss": 0.0612, "step": 2240 }, { "epoch": 0.02, "learning_rate": 0.00029635143023934614, "loss": 0.0623, "step": 2250 }, { "epoch": 0.02, "learning_rate": 0.00029633521437374326, "loss": 0.0631, "step": 2260 }, { "epoch": 0.02, "learning_rate": 0.0002963189985081403, "loss": 0.0651, "step": 2270 }, { "epoch": 0.02, "learning_rate": 0.00029630278264253744, "loss": 0.0596, "step": 2280 }, { "epoch": 0.02, "learning_rate": 0.00029628656677693456, "loss": 0.0705, "step": 2290 }, { "epoch": 0.02, "learning_rate": 0.00029627035091133163, "loss": 0.0786, "step": 2300 }, { "epoch": 0.02, "learning_rate": 0.0002962541350457287, "loss": 0.0724, "step": 2310 }, { "epoch": 0.03, "learning_rate": 0.0002962379191801258, "loss": 0.0981, "step": 2320 }, { "epoch": 0.03, "learning_rate": 0.00029622170331452294, "loss": 0.0646, "step": 2330 }, { "epoch": 0.03, "learning_rate": 0.00029620548744892, "loss": 0.0593, "step": 2340 }, { "epoch": 0.03, "learning_rate": 0.00029618927158331707, "loss": 0.0509, "step": 2350 }, { "epoch": 0.03, "learning_rate": 0.0002961730557177142, "loss": 0.0699, "step": 2360 }, { "epoch": 0.03, "learning_rate": 0.0002961568398521113, "loss": 0.0686, "step": 2370 }, { "epoch": 0.03, "learning_rate": 0.00029614062398650837, "loss": 0.0529, "step": 2380 }, { "epoch": 0.03, "learning_rate": 0.0002961244081209055, "loss": 0.0706, "step": 2390 }, { "epoch": 0.03, "learning_rate": 0.00029610819225530256, "loss": 0.0655, "step": 2400 }, { "epoch": 0.03, "learning_rate": 0.0002960919763896997, "loss": 0.0581, "step": 2410 }, { "epoch": 0.03, "learning_rate": 0.00029607576052409674, "loss": 0.0604, "step": 2420 }, { "epoch": 0.03, "learning_rate": 0.00029605954465849386, "loss": 0.0583, "step": 2430 }, { "epoch": 0.03, "learning_rate": 0.00029604332879289093, "loss": 0.0576, "step": 2440 }, { "epoch": 0.03, "learning_rate": 0.00029602711292728805, "loss": 0.0636, "step": 2450 }, { "epoch": 0.03, "learning_rate": 0.0002960108970616851, "loss": 0.0678, "step": 2460 }, { "epoch": 0.03, "learning_rate": 0.00029599468119608223, "loss": 0.0663, "step": 2470 }, { "epoch": 0.03, "learning_rate": 0.0002959784653304793, "loss": 0.0704, "step": 2480 }, { "epoch": 0.03, "learning_rate": 0.0002959622494648764, "loss": 0.0627, "step": 2490 }, { "epoch": 0.03, "learning_rate": 0.0002959460335992735, "loss": 0.0652, "step": 2500 }, { "epoch": 0.03, "learning_rate": 0.0002959298177336706, "loss": 0.107, "step": 2510 }, { "epoch": 0.03, "learning_rate": 0.00029591360186806767, "loss": 0.0693, "step": 2520 }, { "epoch": 0.03, "learning_rate": 0.0002958973860024648, "loss": 0.0684, "step": 2530 }, { "epoch": 0.03, "learning_rate": 0.00029588117013686186, "loss": 0.0637, "step": 2540 }, { "epoch": 0.03, "learning_rate": 0.000295864954271259, "loss": 0.0638, "step": 2550 }, { "epoch": 0.03, "learning_rate": 0.0002958487384056561, "loss": 0.0628, "step": 2560 }, { "epoch": 0.03, "learning_rate": 0.00029583252254005316, "loss": 0.0535, "step": 2570 }, { "epoch": 0.03, "learning_rate": 0.0002958163066744502, "loss": 0.0551, "step": 2580 }, { "epoch": 0.03, "learning_rate": 0.00029580009080884735, "loss": 0.059, "step": 2590 }, { "epoch": 0.03, "learning_rate": 0.00029578387494324447, "loss": 0.0605, "step": 2600 }, { "epoch": 0.03, "learning_rate": 0.00029576765907764153, "loss": 0.0634, "step": 2610 }, { "epoch": 0.03, "learning_rate": 0.0002957514432120386, "loss": 0.0554, "step": 2620 }, { "epoch": 0.03, "learning_rate": 0.0002957352273464357, "loss": 0.0548, "step": 2630 }, { "epoch": 0.03, "learning_rate": 0.00029571901148083284, "loss": 0.069, "step": 2640 }, { "epoch": 0.03, "learning_rate": 0.0002957027956152299, "loss": 0.0634, "step": 2650 }, { "epoch": 0.03, "learning_rate": 0.00029568657974962697, "loss": 0.0618, "step": 2660 }, { "epoch": 0.03, "learning_rate": 0.0002956703638840241, "loss": 0.0575, "step": 2670 }, { "epoch": 0.03, "learning_rate": 0.0002956541480184212, "loss": 0.0509, "step": 2680 }, { "epoch": 0.03, "learning_rate": 0.00029563793215281833, "loss": 0.0528, "step": 2690 }, { "epoch": 0.03, "learning_rate": 0.0002956217162872154, "loss": 0.0606, "step": 2700 }, { "epoch": 0.03, "learning_rate": 0.00029560550042161246, "loss": 0.0648, "step": 2710 }, { "epoch": 0.03, "learning_rate": 0.0002955892845560096, "loss": 0.0544, "step": 2720 }, { "epoch": 0.03, "learning_rate": 0.0002955730686904067, "loss": 0.0568, "step": 2730 }, { "epoch": 0.03, "learning_rate": 0.00029555685282480376, "loss": 0.0553, "step": 2740 }, { "epoch": 0.03, "learning_rate": 0.00029554063695920083, "loss": 0.0549, "step": 2750 }, { "epoch": 0.03, "learning_rate": 0.00029552442109359795, "loss": 0.0879, "step": 2760 }, { "epoch": 0.03, "learning_rate": 0.00029550820522799507, "loss": 0.0844, "step": 2770 }, { "epoch": 0.03, "learning_rate": 0.00029549198936239214, "loss": 0.0894, "step": 2780 }, { "epoch": 0.03, "learning_rate": 0.0002954757734967892, "loss": 0.0779, "step": 2790 }, { "epoch": 0.03, "learning_rate": 0.0002954595576311863, "loss": 0.0667, "step": 2800 }, { "epoch": 0.03, "learning_rate": 0.00029544334176558344, "loss": 0.0704, "step": 2810 }, { "epoch": 0.03, "learning_rate": 0.0002954271258999805, "loss": 0.0616, "step": 2820 }, { "epoch": 0.03, "learning_rate": 0.0002954109100343776, "loss": 0.0584, "step": 2830 }, { "epoch": 0.03, "learning_rate": 0.0002953946941687747, "loss": 0.0918, "step": 2840 }, { "epoch": 0.03, "learning_rate": 0.0002953784783031718, "loss": 0.0701, "step": 2850 }, { "epoch": 0.03, "learning_rate": 0.0002953622624375689, "loss": 0.0725, "step": 2860 }, { "epoch": 0.03, "learning_rate": 0.000295346046571966, "loss": 0.0636, "step": 2870 }, { "epoch": 0.03, "learning_rate": 0.00029532983070636306, "loss": 0.0612, "step": 2880 }, { "epoch": 0.03, "learning_rate": 0.0002953136148407602, "loss": 0.0669, "step": 2890 }, { "epoch": 0.03, "learning_rate": 0.0002952973989751573, "loss": 0.0568, "step": 2900 }, { "epoch": 0.03, "learning_rate": 0.00029528118310955437, "loss": 0.0551, "step": 2910 }, { "epoch": 0.03, "learning_rate": 0.00029526496724395143, "loss": 0.0648, "step": 2920 }, { "epoch": 0.03, "learning_rate": 0.00029524875137834855, "loss": 0.061, "step": 2930 }, { "epoch": 0.03, "learning_rate": 0.0002952325355127457, "loss": 0.0547, "step": 2940 }, { "epoch": 0.03, "learning_rate": 0.00029521631964714274, "loss": 0.0637, "step": 2950 }, { "epoch": 0.03, "learning_rate": 0.0002952001037815398, "loss": 0.0606, "step": 2960 }, { "epoch": 0.03, "learning_rate": 0.0002951838879159369, "loss": 0.0546, "step": 2970 }, { "epoch": 0.03, "learning_rate": 0.00029516767205033404, "loss": 0.0545, "step": 2980 }, { "epoch": 0.03, "learning_rate": 0.0002951514561847311, "loss": 0.0598, "step": 2990 }, { "epoch": 0.03, "learning_rate": 0.00029513524031912823, "loss": 0.0534, "step": 3000 }, { "epoch": 0.03, "eval_cer": 0.921613794804712, "eval_loss": 0.04357113689184189, "eval_runtime": 120.9669, "eval_samples_per_second": 16.533, "eval_steps_per_second": 4.133, "step": 3000 }, { "epoch": 0.03, "learning_rate": 0.0002951190244535253, "loss": 0.0794, "step": 3010 }, { "epoch": 0.03, "learning_rate": 0.0002951028085879224, "loss": 0.0604, "step": 3020 }, { "epoch": 0.03, "learning_rate": 0.0002950865927223195, "loss": 0.0512, "step": 3030 }, { "epoch": 0.03, "learning_rate": 0.0002950703768567166, "loss": 0.0569, "step": 3040 }, { "epoch": 0.03, "learning_rate": 0.00029505416099111367, "loss": 0.0507, "step": 3050 }, { "epoch": 0.03, "learning_rate": 0.0002950379451255108, "loss": 0.0652, "step": 3060 }, { "epoch": 0.03, "learning_rate": 0.00029502172925990785, "loss": 0.0545, "step": 3070 }, { "epoch": 0.03, "learning_rate": 0.00029500551339430497, "loss": 0.0499, "step": 3080 }, { "epoch": 0.03, "learning_rate": 0.00029498929752870204, "loss": 0.0525, "step": 3090 }, { "epoch": 0.03, "learning_rate": 0.00029497308166309916, "loss": 0.0599, "step": 3100 }, { "epoch": 0.03, "learning_rate": 0.0002949568657974962, "loss": 0.0604, "step": 3110 }, { "epoch": 0.03, "learning_rate": 0.00029494064993189334, "loss": 0.0561, "step": 3120 }, { "epoch": 0.03, "learning_rate": 0.00029492443406629046, "loss": 0.0602, "step": 3130 }, { "epoch": 0.03, "learning_rate": 0.00029490821820068753, "loss": 0.0542, "step": 3140 }, { "epoch": 0.03, "learning_rate": 0.0002948920023350846, "loss": 0.0548, "step": 3150 }, { "epoch": 0.03, "learning_rate": 0.0002948757864694817, "loss": 0.0596, "step": 3160 }, { "epoch": 0.03, "learning_rate": 0.00029485957060387883, "loss": 0.063, "step": 3170 }, { "epoch": 0.03, "learning_rate": 0.0002948433547382759, "loss": 0.0487, "step": 3180 }, { "epoch": 0.03, "learning_rate": 0.00029482713887267297, "loss": 0.0576, "step": 3190 }, { "epoch": 0.03, "learning_rate": 0.0002948109230070701, "loss": 0.0473, "step": 3200 }, { "epoch": 0.03, "learning_rate": 0.0002947947071414672, "loss": 0.0506, "step": 3210 }, { "epoch": 0.03, "learning_rate": 0.00029477849127586427, "loss": 0.0471, "step": 3220 }, { "epoch": 0.03, "learning_rate": 0.00029476227541026134, "loss": 0.0512, "step": 3230 }, { "epoch": 0.04, "learning_rate": 0.00029474605954465846, "loss": 0.0533, "step": 3240 }, { "epoch": 0.04, "learning_rate": 0.0002947298436790556, "loss": 0.0494, "step": 3250 }, { "epoch": 0.04, "learning_rate": 0.00029471362781345264, "loss": 0.0542, "step": 3260 }, { "epoch": 0.04, "learning_rate": 0.00029469741194784976, "loss": 0.0538, "step": 3270 }, { "epoch": 0.04, "learning_rate": 0.00029468119608224683, "loss": 0.0462, "step": 3280 }, { "epoch": 0.04, "learning_rate": 0.00029466498021664395, "loss": 0.058, "step": 3290 }, { "epoch": 0.04, "learning_rate": 0.00029464876435104107, "loss": 0.0448, "step": 3300 }, { "epoch": 0.04, "learning_rate": 0.00029463254848543813, "loss": 0.0527, "step": 3310 }, { "epoch": 0.04, "learning_rate": 0.0002946163326198352, "loss": 0.0513, "step": 3320 }, { "epoch": 0.04, "learning_rate": 0.0002946001167542323, "loss": 0.0503, "step": 3330 }, { "epoch": 0.04, "learning_rate": 0.00029458390088862944, "loss": 0.0506, "step": 3340 }, { "epoch": 0.04, "learning_rate": 0.0002945676850230265, "loss": 0.0514, "step": 3350 }, { "epoch": 0.04, "learning_rate": 0.00029455146915742357, "loss": 0.0524, "step": 3360 }, { "epoch": 0.04, "learning_rate": 0.0002945352532918207, "loss": 0.0501, "step": 3370 }, { "epoch": 0.04, "learning_rate": 0.0002945190374262178, "loss": 0.0514, "step": 3380 }, { "epoch": 0.04, "learning_rate": 0.0002945028215606149, "loss": 0.0543, "step": 3390 }, { "epoch": 0.04, "learning_rate": 0.000294486605695012, "loss": 0.0464, "step": 3400 }, { "epoch": 0.04, "learning_rate": 0.00029447038982940906, "loss": 0.053, "step": 3410 }, { "epoch": 0.04, "learning_rate": 0.0002944541739638062, "loss": 0.0567, "step": 3420 }, { "epoch": 0.04, "learning_rate": 0.00029443795809820325, "loss": 0.0575, "step": 3430 }, { "epoch": 0.04, "learning_rate": 0.00029442174223260037, "loss": 0.0517, "step": 3440 }, { "epoch": 0.04, "learning_rate": 0.00029440552636699743, "loss": 0.0567, "step": 3450 }, { "epoch": 0.04, "learning_rate": 0.00029438931050139455, "loss": 0.0462, "step": 3460 }, { "epoch": 0.04, "learning_rate": 0.0002943730946357916, "loss": 0.0662, "step": 3470 }, { "epoch": 0.04, "learning_rate": 0.00029435687877018874, "loss": 0.0505, "step": 3480 }, { "epoch": 0.04, "learning_rate": 0.0002943406629045858, "loss": 0.0458, "step": 3490 }, { "epoch": 0.04, "learning_rate": 0.0002943244470389829, "loss": 0.0491, "step": 3500 }, { "epoch": 0.04, "learning_rate": 0.00029430823117338, "loss": 0.054, "step": 3510 }, { "epoch": 0.04, "learning_rate": 0.0002942920153077771, "loss": 0.0461, "step": 3520 }, { "epoch": 0.04, "learning_rate": 0.0002942757994421742, "loss": 0.0514, "step": 3530 }, { "epoch": 0.04, "learning_rate": 0.0002942595835765713, "loss": 0.0542, "step": 3540 }, { "epoch": 0.04, "learning_rate": 0.00029424336771096836, "loss": 0.0551, "step": 3550 }, { "epoch": 0.04, "learning_rate": 0.0002942271518453655, "loss": 0.0516, "step": 3560 }, { "epoch": 0.04, "learning_rate": 0.0002942109359797626, "loss": 0.0505, "step": 3570 }, { "epoch": 0.04, "learning_rate": 0.00029419472011415966, "loss": 0.0451, "step": 3580 }, { "epoch": 0.04, "learning_rate": 0.00029417850424855673, "loss": 0.0477, "step": 3590 }, { "epoch": 0.04, "learning_rate": 0.00029416228838295385, "loss": 0.0485, "step": 3600 }, { "epoch": 0.04, "learning_rate": 0.00029414607251735097, "loss": 0.0523, "step": 3610 }, { "epoch": 0.04, "learning_rate": 0.00029412985665174803, "loss": 0.0448, "step": 3620 }, { "epoch": 0.04, "learning_rate": 0.00029411364078614515, "loss": 0.0512, "step": 3630 }, { "epoch": 0.04, "learning_rate": 0.0002940974249205422, "loss": 0.0461, "step": 3640 }, { "epoch": 0.04, "learning_rate": 0.00029408120905493934, "loss": 0.0471, "step": 3650 }, { "epoch": 0.04, "learning_rate": 0.0002940649931893364, "loss": 0.0474, "step": 3660 }, { "epoch": 0.04, "learning_rate": 0.0002940487773237335, "loss": 0.0832, "step": 3670 }, { "epoch": 0.04, "learning_rate": 0.0002940325614581306, "loss": 0.0521, "step": 3680 }, { "epoch": 0.04, "learning_rate": 0.0002940163455925277, "loss": 0.0659, "step": 3690 }, { "epoch": 0.04, "learning_rate": 0.00029400012972692483, "loss": 0.0498, "step": 3700 }, { "epoch": 0.04, "learning_rate": 0.0002939839138613219, "loss": 0.0465, "step": 3710 }, { "epoch": 0.04, "learning_rate": 0.00029396769799571896, "loss": 0.0456, "step": 3720 }, { "epoch": 0.04, "learning_rate": 0.0002939514821301161, "loss": 0.0468, "step": 3730 }, { "epoch": 0.04, "learning_rate": 0.0002939352662645132, "loss": 0.0467, "step": 3740 }, { "epoch": 0.04, "learning_rate": 0.00029391905039891027, "loss": 0.0446, "step": 3750 }, { "epoch": 0.04, "learning_rate": 0.00029390283453330733, "loss": 0.0486, "step": 3760 }, { "epoch": 0.04, "learning_rate": 0.00029388661866770445, "loss": 0.0536, "step": 3770 }, { "epoch": 0.04, "learning_rate": 0.00029387040280210157, "loss": 0.0519, "step": 3780 }, { "epoch": 0.04, "learning_rate": 0.00029385418693649864, "loss": 0.0512, "step": 3790 }, { "epoch": 0.04, "learning_rate": 0.0002938379710708957, "loss": 0.0444, "step": 3800 }, { "epoch": 0.04, "learning_rate": 0.0002938217552052928, "loss": 0.0525, "step": 3810 }, { "epoch": 0.04, "learning_rate": 0.00029380553933968994, "loss": 0.0557, "step": 3820 }, { "epoch": 0.04, "learning_rate": 0.000293789323474087, "loss": 0.0452, "step": 3830 }, { "epoch": 0.04, "learning_rate": 0.00029377310760848413, "loss": 0.0489, "step": 3840 }, { "epoch": 0.04, "learning_rate": 0.0002937568917428812, "loss": 0.0488, "step": 3850 }, { "epoch": 0.04, "learning_rate": 0.0002937406758772783, "loss": 0.0529, "step": 3860 }, { "epoch": 0.04, "learning_rate": 0.00029372446001167543, "loss": 0.0482, "step": 3870 }, { "epoch": 0.04, "learning_rate": 0.0002937082441460725, "loss": 0.049, "step": 3880 }, { "epoch": 0.04, "learning_rate": 0.00029369202828046957, "loss": 0.0559, "step": 3890 }, { "epoch": 0.04, "learning_rate": 0.0002936758124148667, "loss": 0.0563, "step": 3900 }, { "epoch": 0.04, "learning_rate": 0.0002936595965492638, "loss": 0.0492, "step": 3910 }, { "epoch": 0.04, "learning_rate": 0.00029364338068366087, "loss": 0.0468, "step": 3920 }, { "epoch": 0.04, "learning_rate": 0.00029362716481805794, "loss": 0.0459, "step": 3930 }, { "epoch": 0.04, "learning_rate": 0.00029361094895245506, "loss": 0.051, "step": 3940 }, { "epoch": 0.04, "learning_rate": 0.0002935947330868522, "loss": 0.0491, "step": 3950 }, { "epoch": 0.04, "learning_rate": 0.00029357851722124924, "loss": 0.049, "step": 3960 }, { "epoch": 0.04, "learning_rate": 0.0002935623013556463, "loss": 0.0447, "step": 3970 }, { "epoch": 0.04, "learning_rate": 0.00029354608549004343, "loss": 0.0549, "step": 3980 }, { "epoch": 0.04, "learning_rate": 0.00029352986962444055, "loss": 0.059, "step": 3990 }, { "epoch": 0.04, "learning_rate": 0.0002935136537588376, "loss": 0.0461, "step": 4000 }, { "epoch": 0.04, "eval_cer": 0.9216346412756651, "eval_loss": 0.03921321779489517, "eval_runtime": 120.7862, "eval_samples_per_second": 16.558, "eval_steps_per_second": 4.14, "step": 4000 }, { "epoch": 0.04, "learning_rate": 0.00029349743789323473, "loss": 0.0531, "step": 4010 }, { "epoch": 0.04, "learning_rate": 0.0002934812220276318, "loss": 0.0441, "step": 4020 }, { "epoch": 0.04, "learning_rate": 0.0002934650061620289, "loss": 0.0453, "step": 4030 }, { "epoch": 0.04, "learning_rate": 0.000293448790296426, "loss": 0.0461, "step": 4040 }, { "epoch": 0.04, "learning_rate": 0.0002934325744308231, "loss": 0.0509, "step": 4050 }, { "epoch": 0.04, "learning_rate": 0.00029341635856522017, "loss": 0.0471, "step": 4060 }, { "epoch": 0.04, "learning_rate": 0.0002934001426996173, "loss": 0.0445, "step": 4070 }, { "epoch": 0.04, "learning_rate": 0.00029338392683401436, "loss": 0.0531, "step": 4080 }, { "epoch": 0.04, "learning_rate": 0.0002933677109684115, "loss": 0.0472, "step": 4090 }, { "epoch": 0.04, "learning_rate": 0.00029335149510280854, "loss": 0.041, "step": 4100 }, { "epoch": 0.04, "learning_rate": 0.00029333527923720566, "loss": 0.0445, "step": 4110 }, { "epoch": 0.04, "learning_rate": 0.0002933190633716027, "loss": 0.0518, "step": 4120 }, { "epoch": 0.04, "learning_rate": 0.00029330284750599985, "loss": 0.0531, "step": 4130 }, { "epoch": 0.04, "learning_rate": 0.00029328663164039697, "loss": 0.0456, "step": 4140 }, { "epoch": 0.04, "learning_rate": 0.00029327041577479403, "loss": 0.0544, "step": 4150 }, { "epoch": 0.04, "learning_rate": 0.0002932541999091911, "loss": 0.0403, "step": 4160 }, { "epoch": 0.05, "learning_rate": 0.0002932379840435882, "loss": 0.0537, "step": 4170 }, { "epoch": 0.05, "learning_rate": 0.00029322176817798534, "loss": 0.0502, "step": 4180 }, { "epoch": 0.05, "learning_rate": 0.0002932055523123824, "loss": 0.0509, "step": 4190 }, { "epoch": 0.05, "learning_rate": 0.00029318933644677947, "loss": 0.0528, "step": 4200 }, { "epoch": 0.05, "learning_rate": 0.0002931731205811766, "loss": 0.0469, "step": 4210 }, { "epoch": 0.05, "learning_rate": 0.0002931569047155737, "loss": 0.0511, "step": 4220 }, { "epoch": 0.05, "learning_rate": 0.0002931406888499708, "loss": 0.0527, "step": 4230 }, { "epoch": 0.05, "learning_rate": 0.00029312447298436784, "loss": 0.0511, "step": 4240 }, { "epoch": 0.05, "learning_rate": 0.00029310825711876496, "loss": 0.0454, "step": 4250 }, { "epoch": 0.05, "learning_rate": 0.0002930920412531621, "loss": 0.0483, "step": 4260 }, { "epoch": 0.05, "learning_rate": 0.00029307582538755914, "loss": 0.049, "step": 4270 }, { "epoch": 0.05, "learning_rate": 0.00029305960952195626, "loss": 0.0488, "step": 4280 }, { "epoch": 0.05, "learning_rate": 0.00029304339365635333, "loss": 0.0539, "step": 4290 }, { "epoch": 0.05, "learning_rate": 0.00029302717779075045, "loss": 0.059, "step": 4300 }, { "epoch": 0.05, "learning_rate": 0.00029301096192514757, "loss": 0.0471, "step": 4310 }, { "epoch": 0.05, "learning_rate": 0.00029299474605954464, "loss": 0.0492, "step": 4320 }, { "epoch": 0.05, "learning_rate": 0.0002929785301939417, "loss": 0.0466, "step": 4330 }, { "epoch": 0.05, "learning_rate": 0.0002929623143283388, "loss": 0.0499, "step": 4340 }, { "epoch": 0.05, "learning_rate": 0.00029294609846273594, "loss": 0.0442, "step": 4350 }, { "epoch": 0.05, "learning_rate": 0.000292929882597133, "loss": 0.0472, "step": 4360 }, { "epoch": 0.05, "learning_rate": 0.00029291366673153007, "loss": 0.0456, "step": 4370 }, { "epoch": 0.05, "learning_rate": 0.0002928974508659272, "loss": 0.0503, "step": 4380 }, { "epoch": 0.05, "learning_rate": 0.0002928812350003243, "loss": 0.0479, "step": 4390 }, { "epoch": 0.05, "learning_rate": 0.0002928650191347214, "loss": 0.0441, "step": 4400 }, { "epoch": 0.05, "learning_rate": 0.0002928488032691185, "loss": 0.048, "step": 4410 }, { "epoch": 0.05, "learning_rate": 0.00029283258740351556, "loss": 0.04, "step": 4420 }, { "epoch": 0.05, "learning_rate": 0.0002928163715379127, "loss": 0.0527, "step": 4430 }, { "epoch": 0.05, "learning_rate": 0.0002928001556723098, "loss": 0.046, "step": 4440 }, { "epoch": 0.05, "learning_rate": 0.00029278393980670687, "loss": 0.0489, "step": 4450 }, { "epoch": 0.05, "learning_rate": 0.00029276772394110393, "loss": 0.0411, "step": 4460 }, { "epoch": 0.05, "learning_rate": 0.00029275150807550105, "loss": 0.0473, "step": 4470 }, { "epoch": 0.05, "learning_rate": 0.0002927352922098982, "loss": 0.0436, "step": 4480 }, { "epoch": 0.05, "learning_rate": 0.00029271907634429524, "loss": 0.0471, "step": 4490 }, { "epoch": 0.05, "learning_rate": 0.0002927028604786923, "loss": 0.0477, "step": 4500 }, { "epoch": 0.05, "learning_rate": 0.0002926866446130894, "loss": 0.0545, "step": 4510 }, { "epoch": 0.05, "learning_rate": 0.00029267042874748654, "loss": 0.0489, "step": 4520 }, { "epoch": 0.05, "learning_rate": 0.0002926542128818836, "loss": 0.0493, "step": 4530 }, { "epoch": 0.05, "learning_rate": 0.0002926379970162807, "loss": 0.049, "step": 4540 }, { "epoch": 0.05, "learning_rate": 0.0002926217811506778, "loss": 0.0423, "step": 4550 }, { "epoch": 0.05, "learning_rate": 0.0002926055652850749, "loss": 0.0466, "step": 4560 }, { "epoch": 0.05, "learning_rate": 0.000292589349419472, "loss": 0.051, "step": 4570 }, { "epoch": 0.05, "learning_rate": 0.0002925731335538691, "loss": 0.0509, "step": 4580 }, { "epoch": 0.05, "learning_rate": 0.00029255691768826617, "loss": 0.0412, "step": 4590 }, { "epoch": 0.05, "learning_rate": 0.0002925407018226633, "loss": 0.0459, "step": 4600 }, { "epoch": 0.05, "learning_rate": 0.00029252448595706035, "loss": 0.0398, "step": 4610 }, { "epoch": 0.05, "learning_rate": 0.00029250827009145747, "loss": 0.0373, "step": 4620 }, { "epoch": 0.05, "learning_rate": 0.00029249205422585454, "loss": 0.0445, "step": 4630 }, { "epoch": 0.05, "learning_rate": 0.00029247583836025166, "loss": 0.0438, "step": 4640 }, { "epoch": 0.05, "learning_rate": 0.0002924596224946487, "loss": 0.0398, "step": 4650 }, { "epoch": 0.05, "learning_rate": 0.00029244340662904584, "loss": 0.0407, "step": 4660 }, { "epoch": 0.05, "learning_rate": 0.0002924271907634429, "loss": 0.0467, "step": 4670 }, { "epoch": 0.05, "learning_rate": 0.00029241097489784003, "loss": 0.0414, "step": 4680 }, { "epoch": 0.05, "learning_rate": 0.0002923947590322371, "loss": 0.0451, "step": 4690 }, { "epoch": 0.05, "learning_rate": 0.0002923785431666342, "loss": 0.0493, "step": 4700 }, { "epoch": 0.05, "learning_rate": 0.00029236232730103133, "loss": 0.0478, "step": 4710 }, { "epoch": 0.05, "learning_rate": 0.0002923461114354284, "loss": 0.0434, "step": 4720 }, { "epoch": 0.05, "learning_rate": 0.00029232989556982546, "loss": 0.0426, "step": 4730 }, { "epoch": 0.05, "learning_rate": 0.0002923136797042226, "loss": 0.042, "step": 4740 }, { "epoch": 0.05, "learning_rate": 0.0002922974638386197, "loss": 0.045, "step": 4750 }, { "epoch": 0.05, "learning_rate": 0.00029228124797301677, "loss": 0.0395, "step": 4760 }, { "epoch": 0.05, "learning_rate": 0.00029226503210741384, "loss": 0.0432, "step": 4770 }, { "epoch": 0.05, "learning_rate": 0.00029224881624181096, "loss": 0.0433, "step": 4780 }, { "epoch": 0.05, "learning_rate": 0.0002922326003762081, "loss": 0.0499, "step": 4790 }, { "epoch": 0.05, "learning_rate": 0.00029221638451060514, "loss": 0.0486, "step": 4800 }, { "epoch": 0.05, "learning_rate": 0.0002922001686450022, "loss": 0.0388, "step": 4810 }, { "epoch": 0.05, "learning_rate": 0.0002921839527793993, "loss": 0.0411, "step": 4820 }, { "epoch": 0.05, "learning_rate": 0.00029216773691379645, "loss": 0.0402, "step": 4830 }, { "epoch": 0.05, "learning_rate": 0.0002921515210481935, "loss": 0.0417, "step": 4840 }, { "epoch": 0.05, "learning_rate": 0.00029213530518259063, "loss": 0.0431, "step": 4850 }, { "epoch": 0.05, "learning_rate": 0.0002921190893169877, "loss": 0.0408, "step": 4860 }, { "epoch": 0.05, "learning_rate": 0.0002921028734513848, "loss": 0.0398, "step": 4870 }, { "epoch": 0.05, "learning_rate": 0.00029208665758578194, "loss": 0.0566, "step": 4880 }, { "epoch": 0.05, "learning_rate": 0.000292070441720179, "loss": 0.0453, "step": 4890 }, { "epoch": 0.05, "learning_rate": 0.00029205422585457607, "loss": 0.044, "step": 4900 }, { "epoch": 0.05, "learning_rate": 0.0002920380099889732, "loss": 0.0461, "step": 4910 }, { "epoch": 0.05, "learning_rate": 0.0002920217941233703, "loss": 0.0415, "step": 4920 }, { "epoch": 0.05, "learning_rate": 0.0002920055782577674, "loss": 0.0386, "step": 4930 }, { "epoch": 0.05, "learning_rate": 0.00029198936239216444, "loss": 0.0555, "step": 4940 }, { "epoch": 0.05, "learning_rate": 0.00029197314652656156, "loss": 0.046, "step": 4950 }, { "epoch": 0.05, "learning_rate": 0.0002919569306609587, "loss": 0.0481, "step": 4960 }, { "epoch": 0.05, "learning_rate": 0.00029194071479535574, "loss": 0.0429, "step": 4970 }, { "epoch": 0.05, "learning_rate": 0.0002919244989297528, "loss": 0.0439, "step": 4980 }, { "epoch": 0.05, "learning_rate": 0.00029190828306414993, "loss": 0.0493, "step": 4990 }, { "epoch": 0.05, "learning_rate": 0.00029189206719854705, "loss": 0.0416, "step": 5000 }, { "epoch": 0.05, "eval_cer": 0.9216007657603663, "eval_loss": 0.03539329394698143, "eval_runtime": 120.0814, "eval_samples_per_second": 16.655, "eval_steps_per_second": 4.164, "step": 5000 }, { "epoch": 0.05, "learning_rate": 0.0002918758513329441, "loss": 0.0472, "step": 5010 }, { "epoch": 0.05, "learning_rate": 0.00029185963546734124, "loss": 0.0482, "step": 5020 }, { "epoch": 0.05, "learning_rate": 0.0002918434196017383, "loss": 0.0447, "step": 5030 }, { "epoch": 0.05, "learning_rate": 0.0002918272037361354, "loss": 0.0431, "step": 5040 }, { "epoch": 0.05, "learning_rate": 0.00029181098787053254, "loss": 0.0441, "step": 5050 }, { "epoch": 0.05, "learning_rate": 0.0002917947720049296, "loss": 0.0499, "step": 5060 }, { "epoch": 0.05, "learning_rate": 0.00029177855613932667, "loss": 0.0428, "step": 5070 }, { "epoch": 0.05, "learning_rate": 0.0002917623402737238, "loss": 0.0488, "step": 5080 }, { "epoch": 0.06, "learning_rate": 0.0002917461244081209, "loss": 0.0466, "step": 5090 }, { "epoch": 0.06, "learning_rate": 0.000291729908542518, "loss": 0.0459, "step": 5100 }, { "epoch": 0.06, "learning_rate": 0.00029171369267691504, "loss": 0.0492, "step": 5110 }, { "epoch": 0.06, "learning_rate": 0.00029169747681131216, "loss": 0.0482, "step": 5120 }, { "epoch": 0.06, "learning_rate": 0.0002916812609457093, "loss": 0.0454, "step": 5130 }, { "epoch": 0.06, "learning_rate": 0.00029166504508010635, "loss": 0.0446, "step": 5140 }, { "epoch": 0.06, "learning_rate": 0.00029164882921450347, "loss": 0.0412, "step": 5150 }, { "epoch": 0.06, "learning_rate": 0.00029163261334890053, "loss": 0.042, "step": 5160 }, { "epoch": 0.06, "learning_rate": 0.00029161639748329765, "loss": 0.046, "step": 5170 }, { "epoch": 0.06, "learning_rate": 0.0002916001816176947, "loss": 0.0467, "step": 5180 }, { "epoch": 0.06, "learning_rate": 0.00029158396575209184, "loss": 0.0554, "step": 5190 }, { "epoch": 0.06, "learning_rate": 0.0002915677498864889, "loss": 0.0482, "step": 5200 }, { "epoch": 0.06, "learning_rate": 0.000291551534020886, "loss": 0.0492, "step": 5210 }, { "epoch": 0.06, "learning_rate": 0.0002915353181552831, "loss": 0.043, "step": 5220 }, { "epoch": 0.06, "learning_rate": 0.0002915191022896802, "loss": 0.0457, "step": 5230 }, { "epoch": 0.06, "learning_rate": 0.0002915028864240773, "loss": 0.0424, "step": 5240 }, { "epoch": 0.06, "learning_rate": 0.0002914866705584744, "loss": 0.0433, "step": 5250 }, { "epoch": 0.06, "learning_rate": 0.00029147045469287146, "loss": 0.0459, "step": 5260 }, { "epoch": 0.06, "learning_rate": 0.0002914542388272686, "loss": 0.0491, "step": 5270 }, { "epoch": 0.06, "learning_rate": 0.00029143802296166565, "loss": 0.0447, "step": 5280 }, { "epoch": 0.06, "learning_rate": 0.00029142180709606277, "loss": 0.0389, "step": 5290 }, { "epoch": 0.06, "learning_rate": 0.00029140559123045983, "loss": 0.0483, "step": 5300 }, { "epoch": 0.06, "learning_rate": 0.00029138937536485695, "loss": 0.0449, "step": 5310 }, { "epoch": 0.06, "learning_rate": 0.00029137315949925407, "loss": 0.0527, "step": 5320 }, { "epoch": 0.06, "learning_rate": 0.00029135694363365114, "loss": 0.0421, "step": 5330 }, { "epoch": 0.06, "learning_rate": 0.0002913407277680482, "loss": 0.0414, "step": 5340 }, { "epoch": 0.06, "learning_rate": 0.0002913245119024453, "loss": 0.0417, "step": 5350 }, { "epoch": 0.06, "learning_rate": 0.00029130829603684244, "loss": 0.0466, "step": 5360 }, { "epoch": 0.06, "learning_rate": 0.0002912920801712395, "loss": 0.0411, "step": 5370 }, { "epoch": 0.06, "learning_rate": 0.0002912758643056366, "loss": 0.0472, "step": 5380 }, { "epoch": 0.06, "learning_rate": 0.0002912596484400337, "loss": 0.0413, "step": 5390 }, { "epoch": 0.06, "learning_rate": 0.0002912434325744308, "loss": 0.0415, "step": 5400 }, { "epoch": 0.06, "learning_rate": 0.0002912272167088279, "loss": 0.0382, "step": 5410 }, { "epoch": 0.06, "learning_rate": 0.000291211000843225, "loss": 0.0447, "step": 5420 }, { "epoch": 0.06, "learning_rate": 0.00029119478497762207, "loss": 0.0448, "step": 5430 }, { "epoch": 0.06, "learning_rate": 0.0002911785691120192, "loss": 0.0493, "step": 5440 }, { "epoch": 0.06, "learning_rate": 0.0002911623532464163, "loss": 0.0477, "step": 5450 }, { "epoch": 0.06, "learning_rate": 0.00029114613738081337, "loss": 0.0433, "step": 5460 }, { "epoch": 0.06, "learning_rate": 0.00029112992151521044, "loss": 0.0509, "step": 5470 }, { "epoch": 0.06, "learning_rate": 0.00029111370564960756, "loss": 0.0432, "step": 5480 }, { "epoch": 0.06, "learning_rate": 0.0002910974897840047, "loss": 0.0506, "step": 5490 }, { "epoch": 0.06, "learning_rate": 0.00029108127391840174, "loss": 0.0524, "step": 5500 }, { "epoch": 0.06, "learning_rate": 0.0002910650580527988, "loss": 0.0488, "step": 5510 }, { "epoch": 0.06, "learning_rate": 0.0002910488421871959, "loss": 0.0429, "step": 5520 }, { "epoch": 0.06, "learning_rate": 0.00029103262632159305, "loss": 0.0477, "step": 5530 }, { "epoch": 0.06, "learning_rate": 0.0002910164104559901, "loss": 0.0474, "step": 5540 }, { "epoch": 0.06, "learning_rate": 0.0002910001945903872, "loss": 0.0439, "step": 5550 }, { "epoch": 0.06, "learning_rate": 0.0002909839787247843, "loss": 0.049, "step": 5560 }, { "epoch": 0.06, "learning_rate": 0.0002909677628591814, "loss": 0.0469, "step": 5570 }, { "epoch": 0.06, "learning_rate": 0.0002909515469935785, "loss": 0.044, "step": 5580 }, { "epoch": 0.06, "learning_rate": 0.0002909353311279756, "loss": 0.0446, "step": 5590 }, { "epoch": 0.06, "learning_rate": 0.00029091911526237267, "loss": 0.0424, "step": 5600 }, { "epoch": 0.06, "learning_rate": 0.0002909028993967698, "loss": 0.0494, "step": 5610 }, { "epoch": 0.06, "learning_rate": 0.00029088668353116685, "loss": 0.0461, "step": 5620 }, { "epoch": 0.06, "learning_rate": 0.000290870467665564, "loss": 0.0435, "step": 5630 }, { "epoch": 0.06, "learning_rate": 0.00029085425179996104, "loss": 0.0497, "step": 5640 }, { "epoch": 0.06, "learning_rate": 0.00029083803593435816, "loss": 0.0534, "step": 5650 }, { "epoch": 0.06, "learning_rate": 0.0002908218200687552, "loss": 0.0461, "step": 5660 }, { "epoch": 0.06, "learning_rate": 0.00029080560420315235, "loss": 0.05, "step": 5670 }, { "epoch": 0.06, "learning_rate": 0.0002907893883375494, "loss": 0.0438, "step": 5680 }, { "epoch": 0.06, "learning_rate": 0.00029077317247194653, "loss": 0.041, "step": 5690 }, { "epoch": 0.06, "learning_rate": 0.0002907569566063436, "loss": 0.0456, "step": 5700 }, { "epoch": 0.06, "learning_rate": 0.0002907407407407407, "loss": 0.0466, "step": 5710 }, { "epoch": 0.06, "learning_rate": 0.00029072452487513784, "loss": 0.0462, "step": 5720 }, { "epoch": 0.06, "learning_rate": 0.0002907083090095349, "loss": 0.0439, "step": 5730 }, { "epoch": 0.06, "learning_rate": 0.00029069209314393197, "loss": 0.0481, "step": 5740 }, { "epoch": 0.06, "learning_rate": 0.0002906758772783291, "loss": 0.0511, "step": 5750 }, { "epoch": 0.06, "learning_rate": 0.0002906596614127262, "loss": 0.0538, "step": 5760 }, { "epoch": 0.06, "learning_rate": 0.00029064344554712327, "loss": 0.0438, "step": 5770 }, { "epoch": 0.06, "learning_rate": 0.0002906272296815204, "loss": 0.0465, "step": 5780 }, { "epoch": 0.06, "learning_rate": 0.00029061101381591746, "loss": 0.0422, "step": 5790 }, { "epoch": 0.06, "learning_rate": 0.0002905947979503146, "loss": 0.046, "step": 5800 }, { "epoch": 0.06, "learning_rate": 0.00029057858208471164, "loss": 0.0476, "step": 5810 }, { "epoch": 0.06, "learning_rate": 0.00029056236621910876, "loss": 0.0465, "step": 5820 }, { "epoch": 0.06, "learning_rate": 0.00029054615035350583, "loss": 0.0452, "step": 5830 }, { "epoch": 0.06, "learning_rate": 0.00029052993448790295, "loss": 0.0539, "step": 5840 }, { "epoch": 0.06, "learning_rate": 0.0002905137186223, "loss": 0.0472, "step": 5850 }, { "epoch": 0.06, "learning_rate": 0.00029049750275669713, "loss": 0.0496, "step": 5860 }, { "epoch": 0.06, "learning_rate": 0.0002904812868910942, "loss": 0.0466, "step": 5870 }, { "epoch": 0.06, "learning_rate": 0.0002904650710254913, "loss": 0.0423, "step": 5880 }, { "epoch": 0.06, "learning_rate": 0.00029044885515988844, "loss": 0.0423, "step": 5890 }, { "epoch": 0.06, "learning_rate": 0.0002904326392942855, "loss": 0.0551, "step": 5900 }, { "epoch": 0.06, "learning_rate": 0.00029041642342868257, "loss": 0.0518, "step": 5910 }, { "epoch": 0.06, "learning_rate": 0.0002904002075630797, "loss": 0.0499, "step": 5920 }, { "epoch": 0.06, "learning_rate": 0.0002903839916974768, "loss": 0.0686, "step": 5930 }, { "epoch": 0.06, "learning_rate": 0.0002903677758318739, "loss": 0.0467, "step": 5940 }, { "epoch": 0.06, "learning_rate": 0.00029035155996627094, "loss": 0.044, "step": 5950 }, { "epoch": 0.06, "learning_rate": 0.00029033534410066806, "loss": 0.0512, "step": 5960 }, { "epoch": 0.06, "learning_rate": 0.0002903191282350652, "loss": 0.0445, "step": 5970 }, { "epoch": 0.06, "learning_rate": 0.00029030291236946225, "loss": 0.0489, "step": 5980 }, { "epoch": 0.06, "learning_rate": 0.0002902866965038593, "loss": 0.0366, "step": 5990 }, { "epoch": 0.06, "learning_rate": 0.00029027048063825643, "loss": 0.0433, "step": 6000 }, { "epoch": 0.06, "eval_cer": 0.9216250866431449, "eval_loss": 0.033627625554800034, "eval_runtime": 121.2057, "eval_samples_per_second": 16.501, "eval_steps_per_second": 4.125, "step": 6000 }, { "epoch": 0.06, "learning_rate": 0.00029025426477265355, "loss": 0.0386, "step": 6010 }, { "epoch": 0.07, "learning_rate": 0.00029023804890705067, "loss": 0.0464, "step": 6020 }, { "epoch": 0.07, "learning_rate": 0.00029022183304144774, "loss": 0.0433, "step": 6030 }, { "epoch": 0.07, "learning_rate": 0.0002902056171758448, "loss": 0.0471, "step": 6040 }, { "epoch": 0.07, "learning_rate": 0.0002901894013102419, "loss": 0.0426, "step": 6050 }, { "epoch": 0.07, "learning_rate": 0.00029017318544463904, "loss": 0.0427, "step": 6060 }, { "epoch": 0.07, "learning_rate": 0.0002901569695790361, "loss": 0.0403, "step": 6070 }, { "epoch": 0.07, "learning_rate": 0.0002901407537134332, "loss": 0.0447, "step": 6080 }, { "epoch": 0.07, "learning_rate": 0.0002901245378478303, "loss": 0.044, "step": 6090 }, { "epoch": 0.07, "learning_rate": 0.0002901083219822274, "loss": 0.0468, "step": 6100 }, { "epoch": 0.07, "learning_rate": 0.0002900921061166245, "loss": 0.0402, "step": 6110 }, { "epoch": 0.07, "learning_rate": 0.00029007589025102155, "loss": 0.0405, "step": 6120 }, { "epoch": 0.07, "learning_rate": 0.00029005967438541867, "loss": 0.0496, "step": 6130 }, { "epoch": 0.07, "learning_rate": 0.0002900434585198158, "loss": 0.0491, "step": 6140 }, { "epoch": 0.07, "learning_rate": 0.00029002724265421285, "loss": 0.0556, "step": 6150 }, { "epoch": 0.07, "learning_rate": 0.00029001102678860997, "loss": 0.0431, "step": 6160 }, { "epoch": 0.07, "learning_rate": 0.00028999481092300704, "loss": 0.0403, "step": 6170 }, { "epoch": 0.07, "learning_rate": 0.00028997859505740416, "loss": 0.0448, "step": 6180 }, { "epoch": 0.07, "learning_rate": 0.0002899623791918012, "loss": 0.0421, "step": 6190 }, { "epoch": 0.07, "learning_rate": 0.00028994616332619834, "loss": 0.0453, "step": 6200 }, { "epoch": 0.07, "learning_rate": 0.0002899299474605954, "loss": 0.0418, "step": 6210 }, { "epoch": 0.07, "learning_rate": 0.00028991373159499253, "loss": 0.0475, "step": 6220 }, { "epoch": 0.07, "learning_rate": 0.0002898975157293896, "loss": 0.0407, "step": 6230 }, { "epoch": 0.07, "learning_rate": 0.0002898812998637867, "loss": 0.046, "step": 6240 }, { "epoch": 0.07, "learning_rate": 0.0002898650839981838, "loss": 0.0442, "step": 6250 }, { "epoch": 0.07, "learning_rate": 0.0002898488681325809, "loss": 0.0435, "step": 6260 }, { "epoch": 0.07, "learning_rate": 0.00028983265226697796, "loss": 0.0422, "step": 6270 }, { "epoch": 0.07, "learning_rate": 0.0002898164364013751, "loss": 0.0409, "step": 6280 }, { "epoch": 0.07, "learning_rate": 0.00028980022053577215, "loss": 0.041, "step": 6290 }, { "epoch": 0.07, "learning_rate": 0.00028978400467016927, "loss": 0.0356, "step": 6300 }, { "epoch": 0.07, "learning_rate": 0.00028976778880456634, "loss": 0.0383, "step": 6310 }, { "epoch": 0.07, "learning_rate": 0.00028975157293896345, "loss": 0.0382, "step": 6320 }, { "epoch": 0.07, "learning_rate": 0.0002897353570733606, "loss": 0.0409, "step": 6330 }, { "epoch": 0.07, "learning_rate": 0.00028971914120775764, "loss": 0.0401, "step": 6340 }, { "epoch": 0.07, "learning_rate": 0.0002897029253421547, "loss": 0.0427, "step": 6350 }, { "epoch": 0.07, "learning_rate": 0.0002896867094765518, "loss": 0.0416, "step": 6360 }, { "epoch": 0.07, "learning_rate": 0.00028967049361094895, "loss": 0.0402, "step": 6370 }, { "epoch": 0.07, "learning_rate": 0.000289654277745346, "loss": 0.0507, "step": 6380 }, { "epoch": 0.07, "learning_rate": 0.0002896380618797431, "loss": 0.0411, "step": 6390 }, { "epoch": 0.07, "learning_rate": 0.0002896218460141402, "loss": 0.0436, "step": 6400 }, { "epoch": 0.07, "learning_rate": 0.0002896056301485373, "loss": 0.043, "step": 6410 }, { "epoch": 0.07, "learning_rate": 0.0002895894142829344, "loss": 0.0404, "step": 6420 }, { "epoch": 0.07, "learning_rate": 0.0002895731984173315, "loss": 0.0423, "step": 6430 }, { "epoch": 0.07, "learning_rate": 0.00028955698255172857, "loss": 0.0436, "step": 6440 }, { "epoch": 0.07, "learning_rate": 0.0002895407666861257, "loss": 0.0377, "step": 6450 }, { "epoch": 0.07, "learning_rate": 0.0002895245508205228, "loss": 0.0412, "step": 6460 }, { "epoch": 0.07, "learning_rate": 0.0002895083349549199, "loss": 0.0372, "step": 6470 }, { "epoch": 0.07, "learning_rate": 0.00028949211908931694, "loss": 0.0448, "step": 6480 }, { "epoch": 0.07, "learning_rate": 0.00028947590322371406, "loss": 0.0421, "step": 6490 }, { "epoch": 0.07, "learning_rate": 0.0002894596873581112, "loss": 0.0396, "step": 6500 }, { "epoch": 0.07, "learning_rate": 0.00028944347149250824, "loss": 0.0402, "step": 6510 }, { "epoch": 0.07, "learning_rate": 0.0002894272556269053, "loss": 0.0447, "step": 6520 }, { "epoch": 0.07, "learning_rate": 0.00028941103976130243, "loss": 0.0376, "step": 6530 }, { "epoch": 0.07, "learning_rate": 0.00028939482389569955, "loss": 0.046, "step": 6540 }, { "epoch": 0.07, "learning_rate": 0.0002893786080300966, "loss": 0.04, "step": 6550 }, { "epoch": 0.07, "learning_rate": 0.0002893623921644937, "loss": 0.0441, "step": 6560 }, { "epoch": 0.07, "learning_rate": 0.0002893461762988908, "loss": 0.0379, "step": 6570 }, { "epoch": 0.07, "learning_rate": 0.0002893299604332879, "loss": 0.0483, "step": 6580 }, { "epoch": 0.07, "learning_rate": 0.000289313744567685, "loss": 0.0427, "step": 6590 }, { "epoch": 0.07, "learning_rate": 0.0002892975287020821, "loss": 0.0446, "step": 6600 }, { "epoch": 0.07, "learning_rate": 0.00028928131283647917, "loss": 0.0445, "step": 6610 }, { "epoch": 0.07, "learning_rate": 0.0002892650969708763, "loss": 0.0454, "step": 6620 }, { "epoch": 0.07, "learning_rate": 0.0002892488811052734, "loss": 0.0423, "step": 6630 }, { "epoch": 0.07, "learning_rate": 0.0002892326652396705, "loss": 0.0465, "step": 6640 }, { "epoch": 0.07, "learning_rate": 0.00028921644937406754, "loss": 0.0435, "step": 6650 }, { "epoch": 0.07, "learning_rate": 0.00028920023350846466, "loss": 0.0428, "step": 6660 }, { "epoch": 0.07, "learning_rate": 0.0002891840176428618, "loss": 0.041, "step": 6670 }, { "epoch": 0.07, "learning_rate": 0.00028916780177725885, "loss": 0.0383, "step": 6680 }, { "epoch": 0.07, "learning_rate": 0.0002891515859116559, "loss": 0.0424, "step": 6690 }, { "epoch": 0.07, "learning_rate": 0.00028913537004605303, "loss": 0.0369, "step": 6700 }, { "epoch": 0.07, "learning_rate": 0.00028911915418045015, "loss": 0.0459, "step": 6710 }, { "epoch": 0.07, "learning_rate": 0.0002891029383148472, "loss": 0.0438, "step": 6720 }, { "epoch": 0.07, "learning_rate": 0.00028908672244924434, "loss": 0.0379, "step": 6730 }, { "epoch": 0.07, "learning_rate": 0.0002890705065836414, "loss": 0.0418, "step": 6740 }, { "epoch": 0.07, "learning_rate": 0.0002890542907180385, "loss": 0.0438, "step": 6750 }, { "epoch": 0.07, "learning_rate": 0.0002890380748524356, "loss": 0.0431, "step": 6760 }, { "epoch": 0.07, "learning_rate": 0.0002890218589868327, "loss": 0.0471, "step": 6770 }, { "epoch": 0.07, "learning_rate": 0.0002890056431212298, "loss": 0.0387, "step": 6780 }, { "epoch": 0.07, "learning_rate": 0.0002889894272556269, "loss": 0.0363, "step": 6790 }, { "epoch": 0.07, "learning_rate": 0.00028897321139002396, "loss": 0.0371, "step": 6800 }, { "epoch": 0.07, "learning_rate": 0.0002889569955244211, "loss": 0.0421, "step": 6810 }, { "epoch": 0.07, "learning_rate": 0.00028894077965881815, "loss": 0.0421, "step": 6820 }, { "epoch": 0.07, "learning_rate": 0.00028892456379321527, "loss": 0.0368, "step": 6830 }, { "epoch": 0.07, "learning_rate": 0.00028890834792761233, "loss": 0.0374, "step": 6840 }, { "epoch": 0.07, "learning_rate": 0.00028889213206200945, "loss": 0.0407, "step": 6850 }, { "epoch": 0.07, "learning_rate": 0.0002888759161964065, "loss": 0.0466, "step": 6860 }, { "epoch": 0.07, "learning_rate": 0.00028885970033080364, "loss": 0.0418, "step": 6870 }, { "epoch": 0.07, "learning_rate": 0.0002888434844652007, "loss": 0.0449, "step": 6880 }, { "epoch": 0.07, "learning_rate": 0.0002888272685995978, "loss": 0.0395, "step": 6890 }, { "epoch": 0.07, "learning_rate": 0.00028881105273399494, "loss": 0.0423, "step": 6900 }, { "epoch": 0.07, "learning_rate": 0.000288794836868392, "loss": 0.0399, "step": 6910 }, { "epoch": 0.07, "learning_rate": 0.0002887786210027891, "loss": 0.0372, "step": 6920 }, { "epoch": 0.07, "learning_rate": 0.0002887624051371862, "loss": 0.0448, "step": 6930 }, { "epoch": 0.08, "learning_rate": 0.0002887461892715833, "loss": 0.0411, "step": 6940 }, { "epoch": 0.08, "learning_rate": 0.0002887299734059804, "loss": 0.0476, "step": 6950 }, { "epoch": 0.08, "learning_rate": 0.00028871375754037744, "loss": 0.0365, "step": 6960 }, { "epoch": 0.08, "learning_rate": 0.00028869754167477456, "loss": 0.0408, "step": 6970 }, { "epoch": 0.08, "learning_rate": 0.0002886813258091717, "loss": 0.0426, "step": 6980 }, { "epoch": 0.08, "learning_rate": 0.00028866510994356875, "loss": 0.0357, "step": 6990 }, { "epoch": 0.08, "learning_rate": 0.0002886488940779658, "loss": 0.045, "step": 7000 }, { "epoch": 0.08, "eval_cer": 0.9216294296579268, "eval_loss": 0.03147590905427933, "eval_runtime": 120.5116, "eval_samples_per_second": 16.596, "eval_steps_per_second": 4.149, "step": 7000 }, { "epoch": 0.08, "learning_rate": 0.00028863267821236294, "loss": 0.0435, "step": 7010 }, { "epoch": 0.08, "learning_rate": 0.00028861646234676006, "loss": 0.0446, "step": 7020 }, { "epoch": 0.08, "learning_rate": 0.0002886002464811572, "loss": 0.0447, "step": 7030 }, { "epoch": 0.08, "learning_rate": 0.00028858403061555424, "loss": 0.0341, "step": 7040 }, { "epoch": 0.08, "learning_rate": 0.0002885678147499513, "loss": 0.0362, "step": 7050 }, { "epoch": 0.08, "learning_rate": 0.0002885515988843484, "loss": 0.0411, "step": 7060 }, { "epoch": 0.08, "learning_rate": 0.00028853538301874555, "loss": 0.0467, "step": 7070 }, { "epoch": 0.08, "learning_rate": 0.0002885191671531426, "loss": 0.0403, "step": 7080 }, { "epoch": 0.08, "learning_rate": 0.0002885029512875397, "loss": 0.0409, "step": 7090 }, { "epoch": 0.08, "learning_rate": 0.0002884867354219368, "loss": 0.0412, "step": 7100 }, { "epoch": 0.08, "learning_rate": 0.0002884705195563339, "loss": 0.0408, "step": 7110 }, { "epoch": 0.08, "learning_rate": 0.000288454303690731, "loss": 0.0475, "step": 7120 }, { "epoch": 0.08, "learning_rate": 0.00028843808782512805, "loss": 0.0398, "step": 7130 }, { "epoch": 0.08, "learning_rate": 0.00028842187195952517, "loss": 0.0436, "step": 7140 }, { "epoch": 0.08, "learning_rate": 0.0002884056560939223, "loss": 0.0405, "step": 7150 }, { "epoch": 0.08, "learning_rate": 0.00028838944022831935, "loss": 0.0405, "step": 7160 }, { "epoch": 0.08, "learning_rate": 0.0002883732243627165, "loss": 0.0364, "step": 7170 }, { "epoch": 0.08, "learning_rate": 0.00028835700849711354, "loss": 0.037, "step": 7180 }, { "epoch": 0.08, "learning_rate": 0.00028834079263151066, "loss": 0.0437, "step": 7190 }, { "epoch": 0.08, "learning_rate": 0.0002883245767659078, "loss": 0.0445, "step": 7200 }, { "epoch": 0.08, "learning_rate": 0.00028830836090030484, "loss": 0.0442, "step": 7210 }, { "epoch": 0.08, "learning_rate": 0.0002882921450347019, "loss": 0.0418, "step": 7220 }, { "epoch": 0.08, "learning_rate": 0.00028827592916909903, "loss": 0.0386, "step": 7230 }, { "epoch": 0.08, "learning_rate": 0.00028825971330349615, "loss": 0.035, "step": 7240 }, { "epoch": 0.08, "learning_rate": 0.0002882434974378932, "loss": 0.0475, "step": 7250 }, { "epoch": 0.08, "learning_rate": 0.0002882272815722903, "loss": 0.0443, "step": 7260 }, { "epoch": 0.08, "learning_rate": 0.0002882110657066874, "loss": 0.0397, "step": 7270 }, { "epoch": 0.08, "learning_rate": 0.0002881948498410845, "loss": 0.04, "step": 7280 }, { "epoch": 0.08, "learning_rate": 0.0002881786339754816, "loss": 0.0455, "step": 7290 }, { "epoch": 0.08, "learning_rate": 0.00028816241810987865, "loss": 0.0381, "step": 7300 }, { "epoch": 0.08, "learning_rate": 0.00028814620224427577, "loss": 0.0367, "step": 7310 }, { "epoch": 0.08, "learning_rate": 0.0002881299863786729, "loss": 0.04, "step": 7320 }, { "epoch": 0.08, "learning_rate": 0.00028811377051306996, "loss": 0.0424, "step": 7330 }, { "epoch": 0.08, "learning_rate": 0.0002880975546474671, "loss": 0.0459, "step": 7340 }, { "epoch": 0.08, "learning_rate": 0.00028808133878186414, "loss": 0.0368, "step": 7350 }, { "epoch": 0.08, "learning_rate": 0.00028806512291626126, "loss": 0.0415, "step": 7360 }, { "epoch": 0.08, "learning_rate": 0.00028804890705065833, "loss": 0.0438, "step": 7370 }, { "epoch": 0.08, "learning_rate": 0.00028803269118505545, "loss": 0.0513, "step": 7380 }, { "epoch": 0.08, "learning_rate": 0.0002880164753194525, "loss": 0.0311, "step": 7390 }, { "epoch": 0.08, "learning_rate": 0.00028800025945384963, "loss": 0.0439, "step": 7400 }, { "epoch": 0.08, "learning_rate": 0.0002879840435882467, "loss": 0.046, "step": 7410 }, { "epoch": 0.08, "learning_rate": 0.0002879678277226438, "loss": 0.0427, "step": 7420 }, { "epoch": 0.08, "learning_rate": 0.0002879516118570409, "loss": 0.0415, "step": 7430 }, { "epoch": 0.08, "learning_rate": 0.000287935395991438, "loss": 0.0494, "step": 7440 }, { "epoch": 0.08, "learning_rate": 0.00028791918012583507, "loss": 0.0359, "step": 7450 }, { "epoch": 0.08, "learning_rate": 0.0002879029642602322, "loss": 0.0415, "step": 7460 }, { "epoch": 0.08, "learning_rate": 0.0002878867483946293, "loss": 0.0451, "step": 7470 }, { "epoch": 0.08, "learning_rate": 0.0002878705325290264, "loss": 0.0517, "step": 7480 }, { "epoch": 0.08, "learning_rate": 0.00028785431666342344, "loss": 0.0418, "step": 7490 }, { "epoch": 0.08, "learning_rate": 0.00028783810079782056, "loss": 0.0431, "step": 7500 }, { "epoch": 0.08, "learning_rate": 0.0002878218849322177, "loss": 0.0654, "step": 7510 }, { "epoch": 0.08, "learning_rate": 0.00028780566906661475, "loss": 0.0419, "step": 7520 }, { "epoch": 0.08, "learning_rate": 0.0002877894532010118, "loss": 0.0428, "step": 7530 }, { "epoch": 0.08, "learning_rate": 0.00028777323733540893, "loss": 0.0423, "step": 7540 }, { "epoch": 0.08, "learning_rate": 0.00028775702146980605, "loss": 0.0395, "step": 7550 }, { "epoch": 0.08, "learning_rate": 0.0002877408056042031, "loss": 0.0416, "step": 7560 }, { "epoch": 0.08, "learning_rate": 0.0002877245897386002, "loss": 0.0433, "step": 7570 }, { "epoch": 0.08, "learning_rate": 0.0002877083738729973, "loss": 0.0476, "step": 7580 }, { "epoch": 0.08, "learning_rate": 0.0002876921580073944, "loss": 0.0383, "step": 7590 }, { "epoch": 0.08, "learning_rate": 0.0002876759421417915, "loss": 0.0446, "step": 7600 }, { "epoch": 0.08, "learning_rate": 0.0002876597262761886, "loss": 0.0447, "step": 7610 }, { "epoch": 0.08, "learning_rate": 0.0002876435104105857, "loss": 0.0401, "step": 7620 }, { "epoch": 0.08, "learning_rate": 0.0002876272945449828, "loss": 0.0409, "step": 7630 }, { "epoch": 0.08, "learning_rate": 0.0002876110786793799, "loss": 0.0411, "step": 7640 }, { "epoch": 0.08, "learning_rate": 0.000287594862813777, "loss": 0.0378, "step": 7650 }, { "epoch": 0.08, "learning_rate": 0.00028757864694817405, "loss": 0.0465, "step": 7660 }, { "epoch": 0.08, "learning_rate": 0.00028756243108257117, "loss": 0.0413, "step": 7670 }, { "epoch": 0.08, "learning_rate": 0.0002875462152169683, "loss": 0.0387, "step": 7680 }, { "epoch": 0.08, "learning_rate": 0.00028752999935136535, "loss": 0.049, "step": 7690 }, { "epoch": 0.08, "learning_rate": 0.0002875137834857624, "loss": 0.0463, "step": 7700 }, { "epoch": 0.08, "learning_rate": 0.00028749756762015954, "loss": 0.0371, "step": 7710 }, { "epoch": 0.08, "learning_rate": 0.00028748135175455666, "loss": 0.0403, "step": 7720 }, { "epoch": 0.08, "learning_rate": 0.0002874651358889537, "loss": 0.0415, "step": 7730 }, { "epoch": 0.08, "learning_rate": 0.00028744892002335084, "loss": 0.0452, "step": 7740 }, { "epoch": 0.08, "learning_rate": 0.0002874327041577479, "loss": 0.0383, "step": 7750 }, { "epoch": 0.08, "learning_rate": 0.000287416488292145, "loss": 0.0394, "step": 7760 }, { "epoch": 0.08, "learning_rate": 0.0002874002724265421, "loss": 0.0362, "step": 7770 }, { "epoch": 0.08, "learning_rate": 0.0002873840565609392, "loss": 0.043, "step": 7780 }, { "epoch": 0.08, "learning_rate": 0.0002873678406953363, "loss": 0.0395, "step": 7790 }, { "epoch": 0.08, "learning_rate": 0.0002873516248297334, "loss": 0.0391, "step": 7800 }, { "epoch": 0.08, "learning_rate": 0.00028733540896413046, "loss": 0.0403, "step": 7810 }, { "epoch": 0.08, "learning_rate": 0.0002873191930985276, "loss": 0.0384, "step": 7820 }, { "epoch": 0.08, "learning_rate": 0.00028730297723292465, "loss": 0.0396, "step": 7830 }, { "epoch": 0.08, "learning_rate": 0.00028728676136732177, "loss": 0.0361, "step": 7840 }, { "epoch": 0.08, "learning_rate": 0.00028727054550171883, "loss": 0.0409, "step": 7850 }, { "epoch": 0.08, "learning_rate": 0.00028725432963611595, "loss": 0.0379, "step": 7860 }, { "epoch": 0.09, "learning_rate": 0.000287238113770513, "loss": 0.0418, "step": 7870 }, { "epoch": 0.09, "learning_rate": 0.00028722189790491014, "loss": 0.0424, "step": 7880 }, { "epoch": 0.09, "learning_rate": 0.0002872056820393072, "loss": 0.0422, "step": 7890 }, { "epoch": 0.09, "learning_rate": 0.0002871894661737043, "loss": 0.0484, "step": 7900 }, { "epoch": 0.09, "learning_rate": 0.00028717325030810145, "loss": 0.0437, "step": 7910 }, { "epoch": 0.09, "learning_rate": 0.0002871570344424985, "loss": 0.0362, "step": 7920 }, { "epoch": 0.09, "learning_rate": 0.00028714081857689563, "loss": 0.0387, "step": 7930 }, { "epoch": 0.09, "learning_rate": 0.0002871246027112927, "loss": 0.0394, "step": 7940 }, { "epoch": 0.09, "learning_rate": 0.0002871083868456898, "loss": 0.0425, "step": 7950 }, { "epoch": 0.09, "learning_rate": 0.0002870921709800869, "loss": 0.0481, "step": 7960 }, { "epoch": 0.09, "learning_rate": 0.000287075955114484, "loss": 0.0438, "step": 7970 }, { "epoch": 0.09, "learning_rate": 0.00028705973924888107, "loss": 0.0413, "step": 7980 }, { "epoch": 0.09, "learning_rate": 0.0002870435233832782, "loss": 0.0447, "step": 7990 }, { "epoch": 0.09, "learning_rate": 0.00028702730751767525, "loss": 0.0452, "step": 8000 }, { "epoch": 0.09, "eval_cer": 0.9215668902450677, "eval_loss": 0.03050500527024269, "eval_runtime": 119.8198, "eval_samples_per_second": 16.692, "eval_steps_per_second": 4.173, "step": 8000 }, { "epoch": 0.09, "learning_rate": 0.00028701109165207237, "loss": 0.0518, "step": 8010 }, { "epoch": 0.09, "learning_rate": 0.00028699487578646944, "loss": 0.0419, "step": 8020 }, { "epoch": 0.09, "learning_rate": 0.00028697865992086656, "loss": 0.0416, "step": 8030 }, { "epoch": 0.09, "learning_rate": 0.0002869624440552637, "loss": 0.0452, "step": 8040 }, { "epoch": 0.09, "learning_rate": 0.00028694622818966074, "loss": 0.0394, "step": 8050 }, { "epoch": 0.09, "learning_rate": 0.0002869300123240578, "loss": 0.0382, "step": 8060 }, { "epoch": 0.09, "learning_rate": 0.00028691379645845493, "loss": 0.0397, "step": 8070 }, { "epoch": 0.09, "learning_rate": 0.00028689758059285205, "loss": 0.0354, "step": 8080 }, { "epoch": 0.09, "learning_rate": 0.0002868813647272491, "loss": 0.0351, "step": 8090 }, { "epoch": 0.09, "learning_rate": 0.0002868651488616462, "loss": 0.0386, "step": 8100 }, { "epoch": 0.09, "learning_rate": 0.0002868489329960433, "loss": 0.0413, "step": 8110 }, { "epoch": 0.09, "learning_rate": 0.0002868327171304404, "loss": 0.0391, "step": 8120 }, { "epoch": 0.09, "learning_rate": 0.0002868165012648375, "loss": 0.041, "step": 8130 }, { "epoch": 0.09, "learning_rate": 0.00028680028539923455, "loss": 0.0412, "step": 8140 }, { "epoch": 0.09, "learning_rate": 0.00028678406953363167, "loss": 0.0409, "step": 8150 }, { "epoch": 0.09, "learning_rate": 0.0002867678536680288, "loss": 0.0415, "step": 8160 }, { "epoch": 0.09, "learning_rate": 0.00028675163780242586, "loss": 0.0429, "step": 8170 }, { "epoch": 0.09, "learning_rate": 0.000286735421936823, "loss": 0.0384, "step": 8180 }, { "epoch": 0.09, "learning_rate": 0.00028671920607122004, "loss": 0.0387, "step": 8190 }, { "epoch": 0.09, "learning_rate": 0.00028670299020561716, "loss": 0.0399, "step": 8200 }, { "epoch": 0.09, "learning_rate": 0.0002866867743400143, "loss": 0.0387, "step": 8210 }, { "epoch": 0.09, "learning_rate": 0.00028667055847441135, "loss": 0.0371, "step": 8220 }, { "epoch": 0.09, "learning_rate": 0.0002866543426088084, "loss": 0.0357, "step": 8230 }, { "epoch": 0.09, "learning_rate": 0.00028663812674320553, "loss": 0.0426, "step": 8240 }, { "epoch": 0.09, "learning_rate": 0.00028662191087760265, "loss": 0.0356, "step": 8250 }, { "epoch": 0.09, "learning_rate": 0.0002866056950119997, "loss": 0.0348, "step": 8260 }, { "epoch": 0.09, "learning_rate": 0.0002865894791463968, "loss": 0.0402, "step": 8270 }, { "epoch": 0.09, "learning_rate": 0.0002865732632807939, "loss": 0.0398, "step": 8280 }, { "epoch": 0.09, "learning_rate": 0.000286557047415191, "loss": 0.0357, "step": 8290 }, { "epoch": 0.09, "learning_rate": 0.0002865408315495881, "loss": 0.0335, "step": 8300 }, { "epoch": 0.09, "learning_rate": 0.00028652461568398515, "loss": 0.0421, "step": 8310 }, { "epoch": 0.09, "learning_rate": 0.0002865083998183823, "loss": 0.0378, "step": 8320 }, { "epoch": 0.09, "learning_rate": 0.0002864921839527794, "loss": 0.0373, "step": 8330 }, { "epoch": 0.09, "learning_rate": 0.00028647596808717646, "loss": 0.0373, "step": 8340 }, { "epoch": 0.09, "learning_rate": 0.0002864597522215736, "loss": 0.0401, "step": 8350 }, { "epoch": 0.09, "learning_rate": 0.00028644353635597065, "loss": 0.0374, "step": 8360 }, { "epoch": 0.09, "learning_rate": 0.00028642732049036777, "loss": 0.0376, "step": 8370 }, { "epoch": 0.09, "learning_rate": 0.00028641110462476483, "loss": 0.042, "step": 8380 }, { "epoch": 0.09, "learning_rate": 0.00028639488875916195, "loss": 0.0381, "step": 8390 }, { "epoch": 0.09, "learning_rate": 0.000286378672893559, "loss": 0.0379, "step": 8400 }, { "epoch": 0.09, "learning_rate": 0.00028636245702795614, "loss": 0.0375, "step": 8410 }, { "epoch": 0.09, "learning_rate": 0.0002863462411623532, "loss": 0.0402, "step": 8420 }, { "epoch": 0.09, "learning_rate": 0.0002863300252967503, "loss": 0.0355, "step": 8430 }, { "epoch": 0.09, "learning_rate": 0.0002863138094311474, "loss": 0.0405, "step": 8440 }, { "epoch": 0.09, "learning_rate": 0.0002862975935655445, "loss": 0.0385, "step": 8450 }, { "epoch": 0.09, "learning_rate": 0.0002862813776999416, "loss": 0.0409, "step": 8460 }, { "epoch": 0.09, "learning_rate": 0.0002862651618343387, "loss": 0.0316, "step": 8470 }, { "epoch": 0.09, "learning_rate": 0.0002862489459687358, "loss": 0.0402, "step": 8480 }, { "epoch": 0.09, "learning_rate": 0.0002862327301031329, "loss": 0.0355, "step": 8490 }, { "epoch": 0.09, "learning_rate": 0.00028621651423752994, "loss": 0.0357, "step": 8500 }, { "epoch": 0.09, "learning_rate": 0.00028620029837192706, "loss": 0.0396, "step": 8510 }, { "epoch": 0.09, "learning_rate": 0.0002861840825063242, "loss": 0.0371, "step": 8520 }, { "epoch": 0.09, "learning_rate": 0.00028616786664072125, "loss": 0.0418, "step": 8530 }, { "epoch": 0.09, "learning_rate": 0.0002861516507751183, "loss": 0.0414, "step": 8540 }, { "epoch": 0.09, "learning_rate": 0.00028613543490951543, "loss": 0.0383, "step": 8550 }, { "epoch": 0.09, "learning_rate": 0.00028611921904391255, "loss": 0.0455, "step": 8560 }, { "epoch": 0.09, "learning_rate": 0.0002861030031783096, "loss": 0.0417, "step": 8570 }, { "epoch": 0.09, "learning_rate": 0.0002860867873127067, "loss": 0.0404, "step": 8580 }, { "epoch": 0.09, "learning_rate": 0.0002860705714471038, "loss": 0.0327, "step": 8590 }, { "epoch": 0.09, "learning_rate": 0.0002860543555815009, "loss": 0.0338, "step": 8600 }, { "epoch": 0.09, "learning_rate": 0.000286038139715898, "loss": 0.0373, "step": 8610 }, { "epoch": 0.09, "learning_rate": 0.0002860219238502951, "loss": 0.0407, "step": 8620 }, { "epoch": 0.09, "learning_rate": 0.0002860057079846922, "loss": 0.0362, "step": 8630 }, { "epoch": 0.09, "learning_rate": 0.0002859894921190893, "loss": 0.0377, "step": 8640 }, { "epoch": 0.09, "learning_rate": 0.0002859732762534864, "loss": 0.0388, "step": 8650 }, { "epoch": 0.09, "learning_rate": 0.0002859570603878835, "loss": 0.0397, "step": 8660 }, { "epoch": 0.09, "learning_rate": 0.00028594084452228055, "loss": 0.0367, "step": 8670 }, { "epoch": 0.09, "learning_rate": 0.00028592462865667767, "loss": 0.0396, "step": 8680 }, { "epoch": 0.09, "learning_rate": 0.0002859084127910748, "loss": 0.0369, "step": 8690 }, { "epoch": 0.09, "learning_rate": 0.00028589219692547185, "loss": 0.0322, "step": 8700 }, { "epoch": 0.09, "learning_rate": 0.0002858759810598689, "loss": 0.0357, "step": 8710 }, { "epoch": 0.09, "learning_rate": 0.00028585976519426604, "loss": 0.0427, "step": 8720 }, { "epoch": 0.09, "learning_rate": 0.00028584354932866316, "loss": 0.0442, "step": 8730 }, { "epoch": 0.09, "learning_rate": 0.0002858273334630602, "loss": 0.041, "step": 8740 }, { "epoch": 0.09, "learning_rate": 0.00028581111759745734, "loss": 0.0381, "step": 8750 }, { "epoch": 0.09, "learning_rate": 0.0002857949017318544, "loss": 0.0382, "step": 8760 }, { "epoch": 0.09, "learning_rate": 0.00028577868586625153, "loss": 0.038, "step": 8770 }, { "epoch": 0.09, "learning_rate": 0.00028576247000064865, "loss": 0.0381, "step": 8780 }, { "epoch": 0.1, "learning_rate": 0.0002857462541350457, "loss": 0.0401, "step": 8790 }, { "epoch": 0.1, "learning_rate": 0.0002857300382694428, "loss": 0.0389, "step": 8800 }, { "epoch": 0.1, "learning_rate": 0.0002857138224038399, "loss": 0.039, "step": 8810 }, { "epoch": 0.1, "learning_rate": 0.000285697606538237, "loss": 0.0367, "step": 8820 }, { "epoch": 0.1, "learning_rate": 0.0002856813906726341, "loss": 0.0406, "step": 8830 }, { "epoch": 0.1, "learning_rate": 0.00028566517480703115, "loss": 0.042, "step": 8840 }, { "epoch": 0.1, "learning_rate": 0.00028564895894142827, "loss": 0.0371, "step": 8850 }, { "epoch": 0.1, "learning_rate": 0.0002856327430758254, "loss": 0.0373, "step": 8860 }, { "epoch": 0.1, "learning_rate": 0.00028561652721022246, "loss": 0.0328, "step": 8870 }, { "epoch": 0.1, "learning_rate": 0.0002856003113446195, "loss": 0.0324, "step": 8880 }, { "epoch": 0.1, "learning_rate": 0.00028558409547901664, "loss": 0.0344, "step": 8890 }, { "epoch": 0.1, "learning_rate": 0.00028556787961341376, "loss": 0.0392, "step": 8900 }, { "epoch": 0.1, "learning_rate": 0.00028555166374781083, "loss": 0.0405, "step": 8910 }, { "epoch": 0.1, "learning_rate": 0.00028553544788220795, "loss": 0.0334, "step": 8920 }, { "epoch": 0.1, "learning_rate": 0.000285519232016605, "loss": 0.0453, "step": 8930 }, { "epoch": 0.1, "learning_rate": 0.00028550301615100213, "loss": 0.0385, "step": 8940 }, { "epoch": 0.1, "learning_rate": 0.0002854868002853992, "loss": 0.0401, "step": 8950 }, { "epoch": 0.1, "learning_rate": 0.0002854705844197963, "loss": 0.0404, "step": 8960 }, { "epoch": 0.1, "learning_rate": 0.0002854543685541934, "loss": 0.0386, "step": 8970 }, { "epoch": 0.1, "learning_rate": 0.0002854381526885905, "loss": 0.038, "step": 8980 }, { "epoch": 0.1, "learning_rate": 0.00028542193682298757, "loss": 0.0369, "step": 8990 }, { "epoch": 0.1, "learning_rate": 0.0002854057209573847, "loss": 0.04, "step": 9000 }, { "epoch": 0.1, "eval_cer": 0.9215668902450677, "eval_loss": 0.028050633147358894, "eval_runtime": 119.8689, "eval_samples_per_second": 16.685, "eval_steps_per_second": 4.171, "step": 9000 }, { "epoch": 0.1, "learning_rate": 0.00028538950509178176, "loss": 0.0479, "step": 9010 }, { "epoch": 0.1, "learning_rate": 0.0002853732892261789, "loss": 0.0459, "step": 9020 }, { "epoch": 0.1, "learning_rate": 0.00028535707336057594, "loss": 0.0374, "step": 9030 }, { "epoch": 0.1, "learning_rate": 0.00028534085749497306, "loss": 0.0451, "step": 9040 }, { "epoch": 0.1, "learning_rate": 0.0002853246416293702, "loss": 0.0394, "step": 9050 }, { "epoch": 0.1, "learning_rate": 0.00028530842576376725, "loss": 0.0412, "step": 9060 }, { "epoch": 0.1, "learning_rate": 0.0002852922098981643, "loss": 0.0406, "step": 9070 }, { "epoch": 0.1, "learning_rate": 0.00028527599403256143, "loss": 0.0389, "step": 9080 }, { "epoch": 0.1, "learning_rate": 0.00028525977816695855, "loss": 0.0364, "step": 9090 }, { "epoch": 0.1, "learning_rate": 0.0002852435623013556, "loss": 0.0407, "step": 9100 }, { "epoch": 0.1, "learning_rate": 0.0002852273464357527, "loss": 0.0449, "step": 9110 }, { "epoch": 0.1, "learning_rate": 0.0002852111305701498, "loss": 0.045, "step": 9120 }, { "epoch": 0.1, "learning_rate": 0.0002851949147045469, "loss": 0.0459, "step": 9130 }, { "epoch": 0.1, "learning_rate": 0.000285178698838944, "loss": 0.0339, "step": 9140 }, { "epoch": 0.1, "learning_rate": 0.00028516248297334105, "loss": 0.0385, "step": 9150 }, { "epoch": 0.1, "learning_rate": 0.0002851462671077382, "loss": 0.0414, "step": 9160 }, { "epoch": 0.1, "learning_rate": 0.0002851300512421353, "loss": 0.0394, "step": 9170 }, { "epoch": 0.1, "learning_rate": 0.00028511383537653236, "loss": 0.0409, "step": 9180 }, { "epoch": 0.1, "learning_rate": 0.0002850976195109295, "loss": 0.0339, "step": 9190 }, { "epoch": 0.1, "learning_rate": 0.00028508140364532654, "loss": 0.0434, "step": 9200 }, { "epoch": 0.1, "learning_rate": 0.00028506518777972366, "loss": 0.0376, "step": 9210 }, { "epoch": 0.1, "learning_rate": 0.0002850489719141208, "loss": 0.0767, "step": 9220 }, { "epoch": 0.1, "learning_rate": 0.00028503275604851785, "loss": 0.0393, "step": 9230 }, { "epoch": 0.1, "learning_rate": 0.0002850165401829149, "loss": 0.0356, "step": 9240 }, { "epoch": 0.1, "learning_rate": 0.00028500032431731204, "loss": 0.037, "step": 9250 }, { "epoch": 0.1, "learning_rate": 0.00028498410845170916, "loss": 0.0411, "step": 9260 }, { "epoch": 0.1, "learning_rate": 0.0002849678925861062, "loss": 0.0377, "step": 9270 }, { "epoch": 0.1, "learning_rate": 0.0002849516767205033, "loss": 0.0385, "step": 9280 }, { "epoch": 0.1, "learning_rate": 0.0002849354608549004, "loss": 0.0434, "step": 9290 }, { "epoch": 0.1, "learning_rate": 0.0002849192449892975, "loss": 0.0373, "step": 9300 }, { "epoch": 0.1, "learning_rate": 0.0002849030291236946, "loss": 0.0348, "step": 9310 }, { "epoch": 0.1, "learning_rate": 0.00028488681325809166, "loss": 0.0355, "step": 9320 }, { "epoch": 0.1, "learning_rate": 0.0002848705973924888, "loss": 0.0367, "step": 9330 }, { "epoch": 0.1, "learning_rate": 0.0002848543815268859, "loss": 0.034, "step": 9340 }, { "epoch": 0.1, "learning_rate": 0.00028483816566128296, "loss": 0.0346, "step": 9350 }, { "epoch": 0.1, "learning_rate": 0.0002848219497956801, "loss": 0.0362, "step": 9360 }, { "epoch": 0.1, "learning_rate": 0.00028480573393007715, "loss": 0.0389, "step": 9370 }, { "epoch": 0.1, "learning_rate": 0.00028478951806447427, "loss": 0.0388, "step": 9380 }, { "epoch": 0.1, "learning_rate": 0.0002847733021988714, "loss": 0.0414, "step": 9390 }, { "epoch": 0.1, "learning_rate": 0.00028475708633326845, "loss": 0.0399, "step": 9400 }, { "epoch": 0.1, "learning_rate": 0.0002847408704676655, "loss": 0.0407, "step": 9410 }, { "epoch": 0.1, "learning_rate": 0.00028472465460206264, "loss": 0.0407, "step": 9420 }, { "epoch": 0.1, "learning_rate": 0.00028470843873645976, "loss": 0.0351, "step": 9430 }, { "epoch": 0.1, "learning_rate": 0.0002846922228708568, "loss": 0.0357, "step": 9440 }, { "epoch": 0.1, "learning_rate": 0.0002846760070052539, "loss": 0.0432, "step": 9450 }, { "epoch": 0.1, "learning_rate": 0.000284659791139651, "loss": 0.039, "step": 9460 }, { "epoch": 0.1, "learning_rate": 0.00028464357527404813, "loss": 0.0334, "step": 9470 }, { "epoch": 0.1, "learning_rate": 0.0002846273594084452, "loss": 0.044, "step": 9480 }, { "epoch": 0.1, "learning_rate": 0.0002846111435428423, "loss": 0.0516, "step": 9490 }, { "epoch": 0.1, "learning_rate": 0.0002845949276772394, "loss": 0.0345, "step": 9500 }, { "epoch": 0.1, "learning_rate": 0.0002845787118116365, "loss": 0.0382, "step": 9510 }, { "epoch": 0.1, "learning_rate": 0.00028456249594603357, "loss": 0.0419, "step": 9520 }, { "epoch": 0.1, "learning_rate": 0.0002845462800804307, "loss": 0.0423, "step": 9530 }, { "epoch": 0.1, "learning_rate": 0.00028453006421482775, "loss": 0.0382, "step": 9540 }, { "epoch": 0.1, "learning_rate": 0.00028451384834922487, "loss": 0.0382, "step": 9550 }, { "epoch": 0.1, "learning_rate": 0.00028449763248362194, "loss": 0.0343, "step": 9560 }, { "epoch": 0.1, "learning_rate": 0.00028448141661801906, "loss": 0.0381, "step": 9570 }, { "epoch": 0.1, "learning_rate": 0.0002844652007524161, "loss": 0.0355, "step": 9580 }, { "epoch": 0.1, "learning_rate": 0.00028444898488681324, "loss": 0.039, "step": 9590 }, { "epoch": 0.1, "learning_rate": 0.0002844327690212103, "loss": 0.0349, "step": 9600 }, { "epoch": 0.1, "learning_rate": 0.00028441655315560743, "loss": 0.0342, "step": 9610 }, { "epoch": 0.1, "learning_rate": 0.0002844003372900045, "loss": 0.0389, "step": 9620 }, { "epoch": 0.1, "learning_rate": 0.0002843841214244016, "loss": 0.0368, "step": 9630 }, { "epoch": 0.1, "learning_rate": 0.0002843679055587987, "loss": 0.0385, "step": 9640 }, { "epoch": 0.1, "learning_rate": 0.0002843516896931958, "loss": 0.0368, "step": 9650 }, { "epoch": 0.1, "learning_rate": 0.0002843354738275929, "loss": 0.0384, "step": 9660 }, { "epoch": 0.1, "learning_rate": 0.00028431925796199, "loss": 0.0406, "step": 9670 }, { "epoch": 0.1, "learning_rate": 0.00028430304209638705, "loss": 0.041, "step": 9680 }, { "epoch": 0.1, "learning_rate": 0.00028428682623078417, "loss": 0.036, "step": 9690 }, { "epoch": 0.1, "learning_rate": 0.0002842706103651813, "loss": 0.0384, "step": 9700 }, { "epoch": 0.1, "learning_rate": 0.00028425439449957836, "loss": 0.0349, "step": 9710 }, { "epoch": 0.11, "learning_rate": 0.0002842381786339754, "loss": 0.0364, "step": 9720 }, { "epoch": 0.11, "learning_rate": 0.00028422196276837254, "loss": 0.0372, "step": 9730 }, { "epoch": 0.11, "learning_rate": 0.00028420574690276966, "loss": 0.031, "step": 9740 }, { "epoch": 0.11, "learning_rate": 0.0002841895310371667, "loss": 0.0337, "step": 9750 }, { "epoch": 0.11, "learning_rate": 0.00028417331517156385, "loss": 0.0365, "step": 9760 }, { "epoch": 0.11, "learning_rate": 0.0002841570993059609, "loss": 0.0386, "step": 9770 }, { "epoch": 0.11, "learning_rate": 0.00028414088344035803, "loss": 0.0361, "step": 9780 }, { "epoch": 0.11, "learning_rate": 0.00028412466757475515, "loss": 0.0339, "step": 9790 }, { "epoch": 0.11, "learning_rate": 0.0002841084517091522, "loss": 0.0376, "step": 9800 }, { "epoch": 0.11, "learning_rate": 0.0002840922358435493, "loss": 0.0376, "step": 9810 }, { "epoch": 0.11, "learning_rate": 0.0002840760199779464, "loss": 0.0333, "step": 9820 }, { "epoch": 0.11, "learning_rate": 0.0002840598041123435, "loss": 0.0372, "step": 9830 }, { "epoch": 0.11, "learning_rate": 0.0002840435882467406, "loss": 0.031, "step": 9840 }, { "epoch": 0.11, "learning_rate": 0.00028402737238113765, "loss": 0.0422, "step": 9850 }, { "epoch": 0.11, "learning_rate": 0.0002840111565155348, "loss": 0.0336, "step": 9860 }, { "epoch": 0.11, "learning_rate": 0.0002839949406499319, "loss": 0.0402, "step": 9870 }, { "epoch": 0.11, "learning_rate": 0.00028397872478432896, "loss": 0.0339, "step": 9880 }, { "epoch": 0.11, "learning_rate": 0.000283962508918726, "loss": 0.033, "step": 9890 }, { "epoch": 0.11, "learning_rate": 0.00028394629305312314, "loss": 0.0346, "step": 9900 }, { "epoch": 0.11, "learning_rate": 0.00028393007718752026, "loss": 0.036, "step": 9910 }, { "epoch": 0.11, "learning_rate": 0.00028391386132191733, "loss": 0.0348, "step": 9920 }, { "epoch": 0.11, "learning_rate": 0.00028389764545631445, "loss": 0.0318, "step": 9930 }, { "epoch": 0.11, "learning_rate": 0.0002838814295907115, "loss": 0.0327, "step": 9940 }, { "epoch": 0.11, "learning_rate": 0.00028386521372510864, "loss": 0.0365, "step": 9950 }, { "epoch": 0.11, "learning_rate": 0.0002838489978595057, "loss": 0.0383, "step": 9960 }, { "epoch": 0.11, "learning_rate": 0.0002838327819939028, "loss": 0.0357, "step": 9970 }, { "epoch": 0.11, "learning_rate": 0.0002838165661282999, "loss": 0.0328, "step": 9980 }, { "epoch": 0.11, "learning_rate": 0.000283800350262697, "loss": 0.0395, "step": 9990 }, { "epoch": 0.11, "learning_rate": 0.00028378413439709407, "loss": 0.0307, "step": 10000 }, { "epoch": 0.11, "eval_cer": 0.921579050686457, "eval_loss": 0.02728099934756756, "eval_runtime": 119.7696, "eval_samples_per_second": 16.699, "eval_steps_per_second": 4.175, "step": 10000 }, { "epoch": 0.11, "learning_rate": 0.0002837679185314912, "loss": 0.0346, "step": 10010 }, { "epoch": 0.11, "learning_rate": 0.00028375170266588826, "loss": 0.0297, "step": 10020 }, { "epoch": 0.11, "learning_rate": 0.0002837354868002854, "loss": 0.0346, "step": 10030 }, { "epoch": 0.11, "learning_rate": 0.00028371927093468244, "loss": 0.0351, "step": 10040 }, { "epoch": 0.11, "learning_rate": 0.00028370305506907956, "loss": 0.0352, "step": 10050 }, { "epoch": 0.11, "learning_rate": 0.0002836868392034767, "loss": 0.0314, "step": 10060 }, { "epoch": 0.11, "learning_rate": 0.00028367062333787375, "loss": 0.0319, "step": 10070 }, { "epoch": 0.11, "learning_rate": 0.00028365440747227087, "loss": 0.0401, "step": 10080 }, { "epoch": 0.11, "learning_rate": 0.00028363819160666793, "loss": 0.0316, "step": 10090 }, { "epoch": 0.11, "learning_rate": 0.00028362197574106505, "loss": 0.0381, "step": 10100 }, { "epoch": 0.11, "learning_rate": 0.0002836057598754621, "loss": 0.0333, "step": 10110 }, { "epoch": 0.11, "learning_rate": 0.00028358954400985924, "loss": 0.0443, "step": 10120 }, { "epoch": 0.11, "learning_rate": 0.0002835733281442563, "loss": 0.0365, "step": 10130 }, { "epoch": 0.11, "learning_rate": 0.0002835571122786534, "loss": 0.0356, "step": 10140 }, { "epoch": 0.11, "learning_rate": 0.0002835408964130505, "loss": 0.0321, "step": 10150 }, { "epoch": 0.11, "learning_rate": 0.0002835246805474476, "loss": 0.0363, "step": 10160 }, { "epoch": 0.11, "learning_rate": 0.0002835084646818447, "loss": 0.0339, "step": 10170 }, { "epoch": 0.11, "learning_rate": 0.0002834922488162418, "loss": 0.0377, "step": 10180 }, { "epoch": 0.11, "learning_rate": 0.00028347603295063886, "loss": 0.0345, "step": 10190 }, { "epoch": 0.11, "learning_rate": 0.000283459817085036, "loss": 0.0306, "step": 10200 }, { "epoch": 0.11, "learning_rate": 0.00028344360121943305, "loss": 0.0327, "step": 10210 }, { "epoch": 0.11, "learning_rate": 0.00028342738535383017, "loss": 0.0399, "step": 10220 }, { "epoch": 0.11, "learning_rate": 0.0002834111694882273, "loss": 0.0361, "step": 10230 }, { "epoch": 0.11, "learning_rate": 0.00028339495362262435, "loss": 0.0394, "step": 10240 }, { "epoch": 0.11, "learning_rate": 0.0002833787377570214, "loss": 0.0379, "step": 10250 }, { "epoch": 0.11, "learning_rate": 0.00028336252189141854, "loss": 0.0395, "step": 10260 }, { "epoch": 0.11, "learning_rate": 0.00028334630602581566, "loss": 0.0454, "step": 10270 }, { "epoch": 0.11, "learning_rate": 0.0002833300901602127, "loss": 0.037, "step": 10280 }, { "epoch": 0.11, "learning_rate": 0.0002833138742946098, "loss": 0.0398, "step": 10290 }, { "epoch": 0.11, "learning_rate": 0.0002832976584290069, "loss": 0.0401, "step": 10300 }, { "epoch": 0.11, "learning_rate": 0.00028328144256340403, "loss": 0.0382, "step": 10310 }, { "epoch": 0.11, "learning_rate": 0.0002832652266978011, "loss": 0.0342, "step": 10320 }, { "epoch": 0.11, "learning_rate": 0.00028324901083219816, "loss": 0.0365, "step": 10330 }, { "epoch": 0.11, "learning_rate": 0.0002832327949665953, "loss": 0.0383, "step": 10340 }, { "epoch": 0.11, "learning_rate": 0.0002832165791009924, "loss": 0.036, "step": 10350 }, { "epoch": 0.11, "learning_rate": 0.0002832003632353895, "loss": 0.0428, "step": 10360 }, { "epoch": 0.11, "learning_rate": 0.0002831841473697866, "loss": 0.0386, "step": 10370 }, { "epoch": 0.11, "learning_rate": 0.00028316793150418365, "loss": 0.0379, "step": 10380 }, { "epoch": 0.11, "learning_rate": 0.00028315171563858077, "loss": 0.0444, "step": 10390 }, { "epoch": 0.11, "learning_rate": 0.0002831354997729779, "loss": 0.037, "step": 10400 }, { "epoch": 0.11, "learning_rate": 0.00028311928390737496, "loss": 0.0294, "step": 10410 }, { "epoch": 0.11, "learning_rate": 0.000283103068041772, "loss": 0.0387, "step": 10420 }, { "epoch": 0.11, "learning_rate": 0.00028308685217616914, "loss": 0.0341, "step": 10430 }, { "epoch": 0.11, "learning_rate": 0.00028307063631056626, "loss": 0.0369, "step": 10440 }, { "epoch": 0.11, "learning_rate": 0.00028305442044496333, "loss": 0.0326, "step": 10450 }, { "epoch": 0.11, "learning_rate": 0.0002830382045793604, "loss": 0.0367, "step": 10460 }, { "epoch": 0.11, "learning_rate": 0.0002830219887137575, "loss": 0.0321, "step": 10470 }, { "epoch": 0.11, "learning_rate": 0.00028300577284815463, "loss": 0.0335, "step": 10480 }, { "epoch": 0.11, "learning_rate": 0.0002829895569825517, "loss": 0.0392, "step": 10490 }, { "epoch": 0.11, "learning_rate": 0.0002829733411169488, "loss": 0.0382, "step": 10500 }, { "epoch": 0.11, "learning_rate": 0.0002829571252513459, "loss": 0.0367, "step": 10510 }, { "epoch": 0.11, "learning_rate": 0.000282940909385743, "loss": 0.0327, "step": 10520 }, { "epoch": 0.11, "learning_rate": 0.00028292469352014007, "loss": 0.0356, "step": 10530 }, { "epoch": 0.11, "learning_rate": 0.0002829084776545372, "loss": 0.0324, "step": 10540 }, { "epoch": 0.11, "learning_rate": 0.00028289226178893425, "loss": 0.0349, "step": 10550 }, { "epoch": 0.11, "learning_rate": 0.0002828760459233314, "loss": 0.0317, "step": 10560 }, { "epoch": 0.11, "learning_rate": 0.00028285983005772844, "loss": 0.0333, "step": 10570 }, { "epoch": 0.11, "learning_rate": 0.00028284361419212556, "loss": 0.04, "step": 10580 }, { "epoch": 0.11, "learning_rate": 0.0002828273983265226, "loss": 0.0338, "step": 10590 }, { "epoch": 0.11, "learning_rate": 0.00028281118246091975, "loss": 0.0384, "step": 10600 }, { "epoch": 0.11, "learning_rate": 0.0002827949665953168, "loss": 0.0359, "step": 10610 }, { "epoch": 0.11, "learning_rate": 0.00028277875072971393, "loss": 0.0383, "step": 10620 }, { "epoch": 0.11, "learning_rate": 0.000282762534864111, "loss": 0.0379, "step": 10630 }, { "epoch": 0.12, "learning_rate": 0.0002827463189985081, "loss": 0.0375, "step": 10640 }, { "epoch": 0.12, "learning_rate": 0.0002827301031329052, "loss": 0.0315, "step": 10650 }, { "epoch": 0.12, "learning_rate": 0.0002827138872673023, "loss": 0.0348, "step": 10660 }, { "epoch": 0.12, "learning_rate": 0.0002826976714016994, "loss": 0.0369, "step": 10670 }, { "epoch": 0.12, "learning_rate": 0.0002826814555360965, "loss": 0.0387, "step": 10680 }, { "epoch": 0.12, "learning_rate": 0.00028266523967049355, "loss": 0.0339, "step": 10690 }, { "epoch": 0.12, "learning_rate": 0.00028264902380489067, "loss": 0.0396, "step": 10700 }, { "epoch": 0.12, "learning_rate": 0.0002826328079392878, "loss": 0.0427, "step": 10710 }, { "epoch": 0.12, "learning_rate": 0.00028261659207368486, "loss": 0.0358, "step": 10720 }, { "epoch": 0.12, "learning_rate": 0.0002826003762080819, "loss": 0.0349, "step": 10730 }, { "epoch": 0.12, "learning_rate": 0.00028258416034247904, "loss": 0.0361, "step": 10740 }, { "epoch": 0.12, "learning_rate": 0.00028256794447687616, "loss": 0.0349, "step": 10750 }, { "epoch": 0.12, "learning_rate": 0.00028255172861127323, "loss": 0.0338, "step": 10760 }, { "epoch": 0.12, "learning_rate": 0.00028253551274567035, "loss": 0.0427, "step": 10770 }, { "epoch": 0.12, "learning_rate": 0.0002825192968800674, "loss": 0.0495, "step": 10780 }, { "epoch": 0.12, "learning_rate": 0.00028250308101446453, "loss": 0.0354, "step": 10790 }, { "epoch": 0.12, "learning_rate": 0.00028248686514886165, "loss": 0.0358, "step": 10800 }, { "epoch": 0.12, "learning_rate": 0.0002824706492832587, "loss": 0.0326, "step": 10810 }, { "epoch": 0.12, "learning_rate": 0.0002824544334176558, "loss": 0.0406, "step": 10820 }, { "epoch": 0.12, "learning_rate": 0.0002824382175520529, "loss": 0.0319, "step": 10830 }, { "epoch": 0.12, "learning_rate": 0.00028242200168645, "loss": 0.0334, "step": 10840 }, { "epoch": 0.12, "learning_rate": 0.0002824057858208471, "loss": 0.0376, "step": 10850 }, { "epoch": 0.12, "learning_rate": 0.00028238956995524416, "loss": 0.0442, "step": 10860 }, { "epoch": 0.12, "learning_rate": 0.0002823733540896413, "loss": 0.0419, "step": 10870 }, { "epoch": 0.12, "learning_rate": 0.0002823571382240384, "loss": 0.0417, "step": 10880 }, { "epoch": 0.12, "learning_rate": 0.00028234092235843546, "loss": 0.0368, "step": 10890 }, { "epoch": 0.12, "learning_rate": 0.00028232470649283253, "loss": 0.0304, "step": 10900 }, { "epoch": 0.12, "learning_rate": 0.00028230849062722965, "loss": 0.0378, "step": 10910 }, { "epoch": 0.12, "learning_rate": 0.00028229227476162677, "loss": 0.0416, "step": 10920 }, { "epoch": 0.12, "learning_rate": 0.00028227605889602383, "loss": 0.0413, "step": 10930 }, { "epoch": 0.12, "learning_rate": 0.00028225984303042095, "loss": 0.0343, "step": 10940 }, { "epoch": 0.12, "learning_rate": 0.000282243627164818, "loss": 0.0389, "step": 10950 }, { "epoch": 0.12, "learning_rate": 0.00028222741129921514, "loss": 0.0385, "step": 10960 }, { "epoch": 0.12, "learning_rate": 0.00028221119543361226, "loss": 0.0358, "step": 10970 }, { "epoch": 0.12, "learning_rate": 0.0002821949795680093, "loss": 0.0339, "step": 10980 }, { "epoch": 0.12, "learning_rate": 0.0002821787637024064, "loss": 0.0344, "step": 10990 }, { "epoch": 0.12, "learning_rate": 0.0002821625478368035, "loss": 0.0382, "step": 11000 }, { "epoch": 0.12, "eval_cer": 0.9215694960539368, "eval_loss": 0.02685784548521042, "eval_runtime": 119.8402, "eval_samples_per_second": 16.689, "eval_steps_per_second": 4.172, "step": 11000 }, { "epoch": 0.12, "learning_rate": 0.00028214633197120063, "loss": 0.0346, "step": 11010 }, { "epoch": 0.12, "learning_rate": 0.0002821301161055977, "loss": 0.0357, "step": 11020 }, { "epoch": 0.12, "learning_rate": 0.00028211390023999476, "loss": 0.0346, "step": 11030 }, { "epoch": 0.12, "learning_rate": 0.0002820976843743919, "loss": 0.0367, "step": 11040 }, { "epoch": 0.12, "learning_rate": 0.000282081468508789, "loss": 0.036, "step": 11050 }, { "epoch": 0.12, "learning_rate": 0.00028206525264318607, "loss": 0.0408, "step": 11060 }, { "epoch": 0.12, "learning_rate": 0.0002820490367775832, "loss": 0.0321, "step": 11070 }, { "epoch": 0.12, "learning_rate": 0.00028203282091198025, "loss": 0.043, "step": 11080 }, { "epoch": 0.12, "learning_rate": 0.00028201660504637737, "loss": 0.0364, "step": 11090 }, { "epoch": 0.12, "learning_rate": 0.00028200038918077444, "loss": 0.0373, "step": 11100 }, { "epoch": 0.12, "learning_rate": 0.00028198417331517156, "loss": 0.0451, "step": 11110 }, { "epoch": 0.12, "learning_rate": 0.0002819679574495686, "loss": 0.0317, "step": 11120 }, { "epoch": 0.12, "learning_rate": 0.00028195174158396574, "loss": 0.0345, "step": 11130 }, { "epoch": 0.12, "learning_rate": 0.0002819355257183628, "loss": 0.0376, "step": 11140 }, { "epoch": 0.12, "learning_rate": 0.00028191930985275993, "loss": 0.038, "step": 11150 }, { "epoch": 0.12, "learning_rate": 0.000281903093987157, "loss": 0.0364, "step": 11160 }, { "epoch": 0.12, "learning_rate": 0.0002818868781215541, "loss": 0.0389, "step": 11170 }, { "epoch": 0.12, "learning_rate": 0.0002818706622559512, "loss": 0.036, "step": 11180 }, { "epoch": 0.12, "learning_rate": 0.0002818544463903483, "loss": 0.034, "step": 11190 }, { "epoch": 0.12, "learning_rate": 0.00028183823052474536, "loss": 0.0349, "step": 11200 }, { "epoch": 0.12, "learning_rate": 0.0002818220146591425, "loss": 0.0335, "step": 11210 }, { "epoch": 0.12, "learning_rate": 0.00028180579879353955, "loss": 0.0338, "step": 11220 }, { "epoch": 0.12, "learning_rate": 0.00028178958292793667, "loss": 0.035, "step": 11230 }, { "epoch": 0.12, "learning_rate": 0.0002817733670623338, "loss": 0.041, "step": 11240 }, { "epoch": 0.12, "learning_rate": 0.00028175715119673086, "loss": 0.0395, "step": 11250 }, { "epoch": 0.12, "learning_rate": 0.0002817409353311279, "loss": 0.0326, "step": 11260 }, { "epoch": 0.12, "learning_rate": 0.00028172471946552504, "loss": 0.0388, "step": 11270 }, { "epoch": 0.12, "learning_rate": 0.00028170850359992216, "loss": 0.0362, "step": 11280 }, { "epoch": 0.12, "learning_rate": 0.0002816922877343192, "loss": 0.0391, "step": 11290 }, { "epoch": 0.12, "learning_rate": 0.0002816760718687163, "loss": 0.0399, "step": 11300 }, { "epoch": 0.12, "learning_rate": 0.0002816598560031134, "loss": 0.0374, "step": 11310 }, { "epoch": 0.12, "learning_rate": 0.00028164364013751053, "loss": 0.0334, "step": 11320 }, { "epoch": 0.12, "learning_rate": 0.0002816274242719076, "loss": 0.036, "step": 11330 }, { "epoch": 0.12, "learning_rate": 0.00028161120840630466, "loss": 0.0376, "step": 11340 }, { "epoch": 0.12, "learning_rate": 0.0002815949925407018, "loss": 0.0368, "step": 11350 }, { "epoch": 0.12, "learning_rate": 0.0002815787766750989, "loss": 0.0401, "step": 11360 }, { "epoch": 0.12, "learning_rate": 0.000281562560809496, "loss": 0.0335, "step": 11370 }, { "epoch": 0.12, "learning_rate": 0.0002815463449438931, "loss": 0.0352, "step": 11380 }, { "epoch": 0.12, "learning_rate": 0.00028153012907829015, "loss": 0.0387, "step": 11390 }, { "epoch": 0.12, "learning_rate": 0.0002815139132126873, "loss": 0.0322, "step": 11400 }, { "epoch": 0.12, "learning_rate": 0.0002814976973470844, "loss": 0.0347, "step": 11410 }, { "epoch": 0.12, "learning_rate": 0.00028148148148148146, "loss": 0.0359, "step": 11420 }, { "epoch": 0.12, "learning_rate": 0.0002814652656158785, "loss": 0.0307, "step": 11430 }, { "epoch": 0.12, "learning_rate": 0.00028144904975027564, "loss": 0.0368, "step": 11440 }, { "epoch": 0.12, "learning_rate": 0.00028143283388467276, "loss": 0.0382, "step": 11450 }, { "epoch": 0.12, "learning_rate": 0.00028141661801906983, "loss": 0.031, "step": 11460 }, { "epoch": 0.12, "learning_rate": 0.0002814004021534669, "loss": 0.0331, "step": 11470 }, { "epoch": 0.12, "learning_rate": 0.000281384186287864, "loss": 0.038, "step": 11480 }, { "epoch": 0.12, "learning_rate": 0.00028136797042226114, "loss": 0.0345, "step": 11490 }, { "epoch": 0.12, "learning_rate": 0.0002813517545566582, "loss": 0.0398, "step": 11500 }, { "epoch": 0.12, "learning_rate": 0.0002813355386910553, "loss": 0.0353, "step": 11510 }, { "epoch": 0.12, "learning_rate": 0.0002813193228254524, "loss": 0.0367, "step": 11520 }, { "epoch": 0.12, "learning_rate": 0.0002813031069598495, "loss": 0.0308, "step": 11530 }, { "epoch": 0.12, "learning_rate": 0.0002812868910942466, "loss": 0.0353, "step": 11540 }, { "epoch": 0.12, "learning_rate": 0.0002812706752286437, "loss": 0.0368, "step": 11550 }, { "epoch": 0.12, "learning_rate": 0.00028125445936304076, "loss": 0.0378, "step": 11560 }, { "epoch": 0.13, "learning_rate": 0.0002812382434974379, "loss": 0.0378, "step": 11570 }, { "epoch": 0.13, "learning_rate": 0.000281222027631835, "loss": 0.0357, "step": 11580 }, { "epoch": 0.13, "learning_rate": 0.00028120581176623206, "loss": 0.0403, "step": 11590 }, { "epoch": 0.13, "learning_rate": 0.00028118959590062913, "loss": 0.0353, "step": 11600 }, { "epoch": 0.13, "learning_rate": 0.00028117338003502625, "loss": 0.0373, "step": 11610 }, { "epoch": 0.13, "learning_rate": 0.00028115716416942337, "loss": 0.0343, "step": 11620 }, { "epoch": 0.13, "learning_rate": 0.00028114094830382043, "loss": 0.0333, "step": 11630 }, { "epoch": 0.13, "learning_rate": 0.0002811247324382175, "loss": 0.035, "step": 11640 }, { "epoch": 0.13, "learning_rate": 0.0002811085165726146, "loss": 0.0281, "step": 11650 }, { "epoch": 0.13, "learning_rate": 0.00028109230070701174, "loss": 0.0279, "step": 11660 }, { "epoch": 0.13, "learning_rate": 0.0002810760848414088, "loss": 0.0326, "step": 11670 }, { "epoch": 0.13, "learning_rate": 0.0002810598689758059, "loss": 0.0391, "step": 11680 }, { "epoch": 0.13, "learning_rate": 0.000281043653110203, "loss": 0.0394, "step": 11690 }, { "epoch": 0.13, "learning_rate": 0.0002810274372446001, "loss": 0.0433, "step": 11700 }, { "epoch": 0.13, "learning_rate": 0.0002810112213789972, "loss": 0.0362, "step": 11710 }, { "epoch": 0.13, "learning_rate": 0.0002809950055133943, "loss": 0.0335, "step": 11720 }, { "epoch": 0.13, "learning_rate": 0.00028097878964779136, "loss": 0.0378, "step": 11730 }, { "epoch": 0.13, "learning_rate": 0.0002809625737821885, "loss": 0.0295, "step": 11740 }, { "epoch": 0.13, "learning_rate": 0.00028094635791658555, "loss": 0.0383, "step": 11750 }, { "epoch": 0.13, "learning_rate": 0.00028093014205098267, "loss": 0.0334, "step": 11760 }, { "epoch": 0.13, "learning_rate": 0.00028091392618537973, "loss": 0.0376, "step": 11770 }, { "epoch": 0.13, "learning_rate": 0.00028089771031977685, "loss": 0.0351, "step": 11780 }, { "epoch": 0.13, "learning_rate": 0.0002808814944541739, "loss": 0.0368, "step": 11790 }, { "epoch": 0.13, "learning_rate": 0.00028086527858857104, "loss": 0.0351, "step": 11800 }, { "epoch": 0.13, "learning_rate": 0.00028084906272296816, "loss": 0.0327, "step": 11810 }, { "epoch": 0.13, "learning_rate": 0.0002808328468573652, "loss": 0.0356, "step": 11820 }, { "epoch": 0.13, "learning_rate": 0.0002808166309917623, "loss": 0.0331, "step": 11830 }, { "epoch": 0.13, "learning_rate": 0.0002808004151261594, "loss": 0.0345, "step": 11840 }, { "epoch": 0.13, "learning_rate": 0.00028078419926055653, "loss": 0.0393, "step": 11850 }, { "epoch": 0.13, "learning_rate": 0.0002807679833949536, "loss": 0.0329, "step": 11860 }, { "epoch": 0.13, "learning_rate": 0.00028075176752935066, "loss": 0.0365, "step": 11870 }, { "epoch": 0.13, "learning_rate": 0.0002807355516637478, "loss": 0.038, "step": 11880 }, { "epoch": 0.13, "learning_rate": 0.0002807193357981449, "loss": 0.0315, "step": 11890 }, { "epoch": 0.13, "learning_rate": 0.00028070311993254196, "loss": 0.036, "step": 11900 }, { "epoch": 0.13, "learning_rate": 0.00028068690406693903, "loss": 0.0353, "step": 11910 }, { "epoch": 0.13, "learning_rate": 0.00028067068820133615, "loss": 0.0365, "step": 11920 }, { "epoch": 0.13, "learning_rate": 0.00028065447233573327, "loss": 0.0402, "step": 11930 }, { "epoch": 0.13, "learning_rate": 0.00028063825647013034, "loss": 0.0368, "step": 11940 }, { "epoch": 0.13, "learning_rate": 0.00028062204060452746, "loss": 0.0351, "step": 11950 }, { "epoch": 0.13, "learning_rate": 0.0002806058247389245, "loss": 0.0343, "step": 11960 }, { "epoch": 0.13, "learning_rate": 0.00028058960887332164, "loss": 0.0318, "step": 11970 }, { "epoch": 0.13, "learning_rate": 0.00028057339300771876, "loss": 0.0402, "step": 11980 }, { "epoch": 0.13, "learning_rate": 0.0002805571771421158, "loss": 0.0445, "step": 11990 }, { "epoch": 0.13, "learning_rate": 0.0002805409612765129, "loss": 0.036, "step": 12000 }, { "epoch": 0.13, "eval_cer": 0.9215616786273294, "eval_loss": 0.025386789813637733, "eval_runtime": 119.9223, "eval_samples_per_second": 16.677, "eval_steps_per_second": 4.169, "step": 12000 }, { "epoch": 0.13, "learning_rate": 0.00028052474541091, "loss": 0.0339, "step": 12010 }, { "epoch": 0.13, "learning_rate": 0.00028050852954530713, "loss": 0.0388, "step": 12020 }, { "epoch": 0.13, "learning_rate": 0.0002804923136797042, "loss": 0.0365, "step": 12030 }, { "epoch": 0.13, "learning_rate": 0.00028047609781410126, "loss": 0.0401, "step": 12040 }, { "epoch": 0.13, "learning_rate": 0.0002804598819484984, "loss": 0.031, "step": 12050 }, { "epoch": 0.13, "learning_rate": 0.0002804436660828955, "loss": 0.0402, "step": 12060 }, { "epoch": 0.13, "learning_rate": 0.00028042745021729257, "loss": 0.0339, "step": 12070 }, { "epoch": 0.13, "learning_rate": 0.0002804112343516897, "loss": 0.0331, "step": 12080 }, { "epoch": 0.13, "learning_rate": 0.00028039501848608675, "loss": 0.0348, "step": 12090 }, { "epoch": 0.13, "learning_rate": 0.0002803788026204839, "loss": 0.0341, "step": 12100 }, { "epoch": 0.13, "learning_rate": 0.00028036258675488094, "loss": 0.0339, "step": 12110 }, { "epoch": 0.13, "learning_rate": 0.00028034637088927806, "loss": 0.0316, "step": 12120 }, { "epoch": 0.13, "learning_rate": 0.0002803301550236751, "loss": 0.0399, "step": 12130 }, { "epoch": 0.13, "learning_rate": 0.00028031393915807224, "loss": 0.0306, "step": 12140 }, { "epoch": 0.13, "learning_rate": 0.0002802977232924693, "loss": 0.0281, "step": 12150 }, { "epoch": 0.13, "learning_rate": 0.00028028150742686643, "loss": 0.0263, "step": 12160 }, { "epoch": 0.13, "learning_rate": 0.0002802652915612635, "loss": 0.0331, "step": 12170 }, { "epoch": 0.13, "learning_rate": 0.0002802490756956606, "loss": 0.0304, "step": 12180 }, { "epoch": 0.13, "learning_rate": 0.0002802328598300577, "loss": 0.0315, "step": 12190 }, { "epoch": 0.13, "learning_rate": 0.0002802166439644548, "loss": 0.0376, "step": 12200 }, { "epoch": 0.13, "learning_rate": 0.00028020042809885187, "loss": 0.0355, "step": 12210 }, { "epoch": 0.13, "learning_rate": 0.000280184212233249, "loss": 0.0309, "step": 12220 }, { "epoch": 0.13, "learning_rate": 0.0002801679963676461, "loss": 0.0356, "step": 12230 }, { "epoch": 0.13, "learning_rate": 0.00028015178050204317, "loss": 0.0319, "step": 12240 }, { "epoch": 0.13, "learning_rate": 0.0002801355646364403, "loss": 0.0351, "step": 12250 }, { "epoch": 0.13, "learning_rate": 0.00028011934877083736, "loss": 0.0313, "step": 12260 }, { "epoch": 0.13, "learning_rate": 0.0002801031329052345, "loss": 0.0359, "step": 12270 }, { "epoch": 0.13, "learning_rate": 0.00028008691703963154, "loss": 0.0397, "step": 12280 }, { "epoch": 0.13, "learning_rate": 0.00028007070117402866, "loss": 0.0356, "step": 12290 }, { "epoch": 0.13, "learning_rate": 0.00028005448530842573, "loss": 0.0361, "step": 12300 }, { "epoch": 0.13, "learning_rate": 0.00028003826944282285, "loss": 0.0334, "step": 12310 }, { "epoch": 0.13, "learning_rate": 0.0002800220535772199, "loss": 0.0355, "step": 12320 }, { "epoch": 0.13, "learning_rate": 0.00028000583771161703, "loss": 0.0317, "step": 12330 }, { "epoch": 0.13, "learning_rate": 0.0002799896218460141, "loss": 0.0292, "step": 12340 }, { "epoch": 0.13, "learning_rate": 0.0002799734059804112, "loss": 0.0335, "step": 12350 }, { "epoch": 0.13, "learning_rate": 0.0002799571901148083, "loss": 0.0342, "step": 12360 }, { "epoch": 0.13, "learning_rate": 0.0002799409742492054, "loss": 0.0343, "step": 12370 }, { "epoch": 0.13, "learning_rate": 0.0002799247583836025, "loss": 0.0332, "step": 12380 }, { "epoch": 0.13, "learning_rate": 0.0002799085425179996, "loss": 0.0341, "step": 12390 }, { "epoch": 0.13, "learning_rate": 0.00027989232665239666, "loss": 0.0351, "step": 12400 }, { "epoch": 0.13, "learning_rate": 0.0002798761107867938, "loss": 0.0345, "step": 12410 }, { "epoch": 0.13, "learning_rate": 0.0002798598949211909, "loss": 0.0326, "step": 12420 }, { "epoch": 0.13, "learning_rate": 0.00027984367905558796, "loss": 0.032, "step": 12430 }, { "epoch": 0.13, "learning_rate": 0.000279827463189985, "loss": 0.0405, "step": 12440 }, { "epoch": 0.13, "learning_rate": 0.00027981124732438215, "loss": 0.0384, "step": 12450 }, { "epoch": 0.13, "learning_rate": 0.00027979503145877927, "loss": 0.039, "step": 12460 }, { "epoch": 0.13, "learning_rate": 0.00027977881559317633, "loss": 0.0309, "step": 12470 }, { "epoch": 0.13, "learning_rate": 0.0002797625997275734, "loss": 0.0313, "step": 12480 }, { "epoch": 0.14, "learning_rate": 0.0002797463838619705, "loss": 0.0408, "step": 12490 }, { "epoch": 0.14, "learning_rate": 0.00027973016799636764, "loss": 0.0338, "step": 12500 }, { "epoch": 0.14, "learning_rate": 0.0002797139521307647, "loss": 0.0326, "step": 12510 }, { "epoch": 0.14, "learning_rate": 0.0002796977362651618, "loss": 0.0331, "step": 12520 }, { "epoch": 0.14, "learning_rate": 0.0002796815203995589, "loss": 0.0292, "step": 12530 }, { "epoch": 0.14, "learning_rate": 0.000279665304533956, "loss": 0.0299, "step": 12540 }, { "epoch": 0.14, "learning_rate": 0.00027964908866835313, "loss": 0.0324, "step": 12550 }, { "epoch": 0.14, "learning_rate": 0.0002796328728027502, "loss": 0.0287, "step": 12560 }, { "epoch": 0.14, "learning_rate": 0.00027961665693714726, "loss": 0.0395, "step": 12570 }, { "epoch": 0.14, "learning_rate": 0.0002796004410715444, "loss": 0.0369, "step": 12580 }, { "epoch": 0.14, "learning_rate": 0.0002795842252059415, "loss": 0.0318, "step": 12590 }, { "epoch": 0.14, "learning_rate": 0.00027956800934033857, "loss": 0.0341, "step": 12600 }, { "epoch": 0.14, "learning_rate": 0.00027955179347473563, "loss": 0.0351, "step": 12610 }, { "epoch": 0.14, "learning_rate": 0.00027953557760913275, "loss": 0.0343, "step": 12620 }, { "epoch": 0.14, "learning_rate": 0.00027951936174352987, "loss": 0.028, "step": 12630 }, { "epoch": 0.14, "learning_rate": 0.00027950314587792694, "loss": 0.0339, "step": 12640 }, { "epoch": 0.14, "learning_rate": 0.000279486930012324, "loss": 0.0329, "step": 12650 }, { "epoch": 0.14, "learning_rate": 0.0002794707141467211, "loss": 0.0363, "step": 12660 }, { "epoch": 0.14, "learning_rate": 0.00027945449828111824, "loss": 0.0466, "step": 12670 }, { "epoch": 0.14, "learning_rate": 0.0002794382824155153, "loss": 0.0397, "step": 12680 }, { "epoch": 0.14, "learning_rate": 0.0002794220665499124, "loss": 0.0314, "step": 12690 }, { "epoch": 0.14, "learning_rate": 0.0002794058506843095, "loss": 0.0332, "step": 12700 }, { "epoch": 0.14, "learning_rate": 0.0002793896348187066, "loss": 0.0311, "step": 12710 }, { "epoch": 0.14, "learning_rate": 0.0002793734189531037, "loss": 0.0363, "step": 12720 }, { "epoch": 0.14, "learning_rate": 0.0002793572030875008, "loss": 0.032, "step": 12730 }, { "epoch": 0.14, "learning_rate": 0.00027934098722189786, "loss": 0.0325, "step": 12740 }, { "epoch": 0.14, "learning_rate": 0.000279324771356295, "loss": 0.0335, "step": 12750 }, { "epoch": 0.14, "learning_rate": 0.00027930855549069205, "loss": 0.032, "step": 12760 }, { "epoch": 0.14, "learning_rate": 0.00027929233962508917, "loss": 0.0328, "step": 12770 }, { "epoch": 0.14, "learning_rate": 0.00027927612375948623, "loss": 0.0303, "step": 12780 }, { "epoch": 0.14, "learning_rate": 0.00027925990789388335, "loss": 0.0337, "step": 12790 }, { "epoch": 0.14, "learning_rate": 0.0002792436920282804, "loss": 0.035, "step": 12800 }, { "epoch": 0.14, "learning_rate": 0.00027922747616267754, "loss": 0.0322, "step": 12810 }, { "epoch": 0.14, "learning_rate": 0.00027921126029707466, "loss": 0.0353, "step": 12820 }, { "epoch": 0.14, "learning_rate": 0.0002791950444314717, "loss": 0.0376, "step": 12830 }, { "epoch": 0.14, "learning_rate": 0.0002791788285658688, "loss": 0.0376, "step": 12840 }, { "epoch": 0.14, "learning_rate": 0.0002791626127002659, "loss": 0.0364, "step": 12850 }, { "epoch": 0.14, "learning_rate": 0.00027914639683466303, "loss": 0.0348, "step": 12860 }, { "epoch": 0.14, "learning_rate": 0.0002791301809690601, "loss": 0.0354, "step": 12870 }, { "epoch": 0.14, "learning_rate": 0.00027911396510345716, "loss": 0.0455, "step": 12880 }, { "epoch": 0.14, "learning_rate": 0.0002790977492378543, "loss": 0.0382, "step": 12890 }, { "epoch": 0.14, "learning_rate": 0.0002790815333722514, "loss": 0.0423, "step": 12900 }, { "epoch": 0.14, "learning_rate": 0.00027906531750664847, "loss": 0.0341, "step": 12910 }, { "epoch": 0.14, "learning_rate": 0.00027904910164104553, "loss": 0.0424, "step": 12920 }, { "epoch": 0.14, "learning_rate": 0.00027903288577544265, "loss": 0.0346, "step": 12930 }, { "epoch": 0.14, "learning_rate": 0.00027901666990983977, "loss": 0.0318, "step": 12940 }, { "epoch": 0.14, "learning_rate": 0.00027900045404423684, "loss": 0.0331, "step": 12950 }, { "epoch": 0.14, "learning_rate": 0.00027898423817863396, "loss": 0.033, "step": 12960 }, { "epoch": 0.14, "learning_rate": 0.000278968022313031, "loss": 0.0324, "step": 12970 }, { "epoch": 0.14, "learning_rate": 0.00027895180644742814, "loss": 0.0325, "step": 12980 }, { "epoch": 0.14, "learning_rate": 0.00027893559058182526, "loss": 0.0325, "step": 12990 }, { "epoch": 0.14, "learning_rate": 0.00027891937471622233, "loss": 0.0412, "step": 13000 }, { "epoch": 0.14, "eval_cer": 0.9216059773781046, "eval_loss": 0.025849705561995506, "eval_runtime": 120.1846, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 13000 }, { "epoch": 0.14, "learning_rate": 0.0002789031588506194, "loss": 0.0486, "step": 13010 }, { "epoch": 0.14, "learning_rate": 0.0002788869429850165, "loss": 0.0407, "step": 13020 }, { "epoch": 0.14, "learning_rate": 0.00027887072711941363, "loss": 0.0337, "step": 13030 }, { "epoch": 0.14, "learning_rate": 0.0002788545112538107, "loss": 0.0411, "step": 13040 }, { "epoch": 0.14, "learning_rate": 0.00027883829538820777, "loss": 0.0356, "step": 13050 }, { "epoch": 0.14, "learning_rate": 0.0002788220795226049, "loss": 0.0417, "step": 13060 }, { "epoch": 0.14, "learning_rate": 0.000278805863657002, "loss": 0.0295, "step": 13070 }, { "epoch": 0.14, "learning_rate": 0.00027878964779139907, "loss": 0.0361, "step": 13080 }, { "epoch": 0.14, "learning_rate": 0.0002787734319257962, "loss": 0.033, "step": 13090 }, { "epoch": 0.14, "learning_rate": 0.00027875721606019326, "loss": 0.0347, "step": 13100 }, { "epoch": 0.14, "learning_rate": 0.0002787410001945904, "loss": 0.0313, "step": 13110 }, { "epoch": 0.14, "learning_rate": 0.0002787247843289875, "loss": 0.0395, "step": 13120 }, { "epoch": 0.14, "learning_rate": 0.00027870856846338456, "loss": 0.0346, "step": 13130 }, { "epoch": 0.14, "learning_rate": 0.00027869235259778163, "loss": 0.0309, "step": 13140 }, { "epoch": 0.14, "learning_rate": 0.00027867613673217875, "loss": 0.045, "step": 13150 }, { "epoch": 0.14, "learning_rate": 0.00027865992086657587, "loss": 0.0347, "step": 13160 }, { "epoch": 0.14, "learning_rate": 0.00027864370500097293, "loss": 0.0355, "step": 13170 }, { "epoch": 0.14, "learning_rate": 0.00027862748913537, "loss": 0.0426, "step": 13180 }, { "epoch": 0.14, "learning_rate": 0.0002786112732697671, "loss": 0.045, "step": 13190 }, { "epoch": 0.14, "learning_rate": 0.00027859505740416424, "loss": 0.0338, "step": 13200 }, { "epoch": 0.14, "learning_rate": 0.0002785788415385613, "loss": 0.0324, "step": 13210 }, { "epoch": 0.14, "learning_rate": 0.00027856262567295837, "loss": 0.0338, "step": 13220 }, { "epoch": 0.14, "learning_rate": 0.0002785464098073555, "loss": 0.0333, "step": 13230 }, { "epoch": 0.14, "learning_rate": 0.0002785301939417526, "loss": 0.0844, "step": 13240 }, { "epoch": 0.14, "learning_rate": 0.0002785139780761497, "loss": 0.0348, "step": 13250 }, { "epoch": 0.14, "learning_rate": 0.0002784977622105468, "loss": 0.0342, "step": 13260 }, { "epoch": 0.14, "learning_rate": 0.00027848154634494386, "loss": 0.0345, "step": 13270 }, { "epoch": 0.14, "learning_rate": 0.000278465330479341, "loss": 0.0353, "step": 13280 }, { "epoch": 0.14, "learning_rate": 0.00027844911461373805, "loss": 0.0313, "step": 13290 }, { "epoch": 0.14, "learning_rate": 0.00027843289874813517, "loss": 0.0368, "step": 13300 }, { "epoch": 0.14, "learning_rate": 0.00027841668288253223, "loss": 0.0314, "step": 13310 }, { "epoch": 0.14, "learning_rate": 0.00027840046701692935, "loss": 0.0349, "step": 13320 }, { "epoch": 0.14, "learning_rate": 0.0002783842511513264, "loss": 0.0358, "step": 13330 }, { "epoch": 0.14, "learning_rate": 0.00027836803528572354, "loss": 0.034, "step": 13340 }, { "epoch": 0.14, "learning_rate": 0.0002783518194201206, "loss": 0.0474, "step": 13350 }, { "epoch": 0.14, "learning_rate": 0.0002783356035545177, "loss": 0.0346, "step": 13360 }, { "epoch": 0.14, "learning_rate": 0.0002783193876889148, "loss": 0.036, "step": 13370 }, { "epoch": 0.14, "learning_rate": 0.0002783031718233119, "loss": 0.041, "step": 13380 }, { "epoch": 0.14, "learning_rate": 0.00027828695595770903, "loss": 0.0397, "step": 13390 }, { "epoch": 0.14, "learning_rate": 0.0002782707400921061, "loss": 0.0341, "step": 13400 }, { "epoch": 0.14, "learning_rate": 0.00027825452422650316, "loss": 0.0313, "step": 13410 }, { "epoch": 0.15, "learning_rate": 0.0002782383083609003, "loss": 0.0329, "step": 13420 }, { "epoch": 0.15, "learning_rate": 0.0002782220924952974, "loss": 0.0845, "step": 13430 }, { "epoch": 0.15, "learning_rate": 0.00027820587662969446, "loss": 0.0418, "step": 13440 }, { "epoch": 0.15, "learning_rate": 0.00027818966076409153, "loss": 0.0442, "step": 13450 }, { "epoch": 0.15, "learning_rate": 0.00027817344489848865, "loss": 0.0336, "step": 13460 }, { "epoch": 0.15, "learning_rate": 0.00027815722903288577, "loss": 0.0342, "step": 13470 }, { "epoch": 0.15, "learning_rate": 0.00027814101316728284, "loss": 0.0341, "step": 13480 }, { "epoch": 0.15, "learning_rate": 0.0002781247973016799, "loss": 0.0334, "step": 13490 }, { "epoch": 0.15, "learning_rate": 0.000278108581436077, "loss": 0.0308, "step": 13500 }, { "epoch": 0.15, "learning_rate": 0.00027809236557047414, "loss": 0.03, "step": 13510 }, { "epoch": 0.15, "learning_rate": 0.0002780761497048712, "loss": 0.0457, "step": 13520 }, { "epoch": 0.15, "learning_rate": 0.0002780599338392683, "loss": 0.0372, "step": 13530 }, { "epoch": 0.15, "learning_rate": 0.0002780437179736654, "loss": 0.0297, "step": 13540 }, { "epoch": 0.15, "learning_rate": 0.0002780275021080625, "loss": 0.0325, "step": 13550 }, { "epoch": 0.15, "learning_rate": 0.00027801128624245963, "loss": 0.0341, "step": 13560 }, { "epoch": 0.15, "learning_rate": 0.0002779950703768567, "loss": 0.0329, "step": 13570 }, { "epoch": 0.15, "learning_rate": 0.00027797885451125376, "loss": 0.0324, "step": 13580 }, { "epoch": 0.15, "learning_rate": 0.0002779626386456509, "loss": 0.029, "step": 13590 }, { "epoch": 0.15, "learning_rate": 0.000277946422780048, "loss": 0.0345, "step": 13600 }, { "epoch": 0.15, "learning_rate": 0.00027793020691444507, "loss": 0.0314, "step": 13610 }, { "epoch": 0.15, "learning_rate": 0.00027791399104884213, "loss": 0.0311, "step": 13620 }, { "epoch": 0.15, "learning_rate": 0.00027789777518323925, "loss": 0.0396, "step": 13630 }, { "epoch": 0.15, "learning_rate": 0.0002778815593176364, "loss": 0.0309, "step": 13640 }, { "epoch": 0.15, "learning_rate": 0.00027786534345203344, "loss": 0.0285, "step": 13650 }, { "epoch": 0.15, "learning_rate": 0.0002778491275864305, "loss": 0.0278, "step": 13660 }, { "epoch": 0.15, "learning_rate": 0.0002778329117208276, "loss": 0.0331, "step": 13670 }, { "epoch": 0.15, "learning_rate": 0.00027781669585522474, "loss": 0.0318, "step": 13680 }, { "epoch": 0.15, "learning_rate": 0.00027780047998962186, "loss": 0.0313, "step": 13690 }, { "epoch": 0.15, "learning_rate": 0.00027778426412401893, "loss": 0.0283, "step": 13700 }, { "epoch": 0.15, "learning_rate": 0.000277768048258416, "loss": 0.035, "step": 13710 }, { "epoch": 0.15, "learning_rate": 0.0002777518323928131, "loss": 0.0304, "step": 13720 }, { "epoch": 0.15, "learning_rate": 0.00027773561652721023, "loss": 0.0354, "step": 13730 }, { "epoch": 0.15, "learning_rate": 0.0002777194006616073, "loss": 0.0344, "step": 13740 }, { "epoch": 0.15, "learning_rate": 0.00027770318479600437, "loss": 0.0348, "step": 13750 }, { "epoch": 0.15, "learning_rate": 0.0002776869689304015, "loss": 0.0328, "step": 13760 }, { "epoch": 0.15, "learning_rate": 0.0002776707530647986, "loss": 0.0368, "step": 13770 }, { "epoch": 0.15, "learning_rate": 0.00027765453719919567, "loss": 0.0342, "step": 13780 }, { "epoch": 0.15, "learning_rate": 0.00027763832133359274, "loss": 0.0268, "step": 13790 }, { "epoch": 0.15, "learning_rate": 0.00027762210546798986, "loss": 0.0298, "step": 13800 }, { "epoch": 0.15, "learning_rate": 0.000277605889602387, "loss": 0.0652, "step": 13810 }, { "epoch": 0.15, "learning_rate": 0.00027758967373678404, "loss": 0.0309, "step": 13820 }, { "epoch": 0.15, "learning_rate": 0.00027757345787118116, "loss": 0.03, "step": 13830 }, { "epoch": 0.15, "learning_rate": 0.00027755724200557823, "loss": 0.0903, "step": 13840 }, { "epoch": 0.15, "learning_rate": 0.00027754102613997535, "loss": 0.0487, "step": 13850 }, { "epoch": 0.15, "learning_rate": 0.0002775248102743724, "loss": 0.0474, "step": 13860 }, { "epoch": 0.15, "learning_rate": 0.00027750859440876953, "loss": 0.0322, "step": 13870 }, { "epoch": 0.15, "learning_rate": 0.0002774923785431666, "loss": 0.0306, "step": 13880 }, { "epoch": 0.15, "learning_rate": 0.0002774761626775637, "loss": 0.1102, "step": 13890 }, { "epoch": 0.15, "learning_rate": 0.0002774599468119608, "loss": 0.0365, "step": 13900 }, { "epoch": 0.15, "learning_rate": 0.0002774437309463579, "loss": 0.0324, "step": 13910 }, { "epoch": 0.15, "learning_rate": 0.00027742751508075497, "loss": 0.0335, "step": 13920 }, { "epoch": 0.15, "learning_rate": 0.0002774112992151521, "loss": 0.033, "step": 13930 }, { "epoch": 0.15, "learning_rate": 0.00027739508334954916, "loss": 0.0327, "step": 13940 }, { "epoch": 0.15, "learning_rate": 0.0002773788674839463, "loss": 0.0316, "step": 13950 }, { "epoch": 0.15, "learning_rate": 0.00027736265161834334, "loss": 0.0322, "step": 13960 }, { "epoch": 0.15, "learning_rate": 0.00027734643575274046, "loss": 0.0365, "step": 13970 }, { "epoch": 0.15, "learning_rate": 0.0002773302198871375, "loss": 0.038, "step": 13980 }, { "epoch": 0.15, "learning_rate": 0.00027731400402153465, "loss": 0.0291, "step": 13990 }, { "epoch": 0.15, "learning_rate": 0.00027729778815593177, "loss": 0.0404, "step": 14000 }, { "epoch": 0.15, "eval_cer": 0.9215990285544536, "eval_loss": 0.023803718388080597, "eval_runtime": 119.9898, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 14000 }, { "epoch": 0.15, "learning_rate": 0.00027728157229032883, "loss": 0.0351, "step": 14010 }, { "epoch": 0.15, "learning_rate": 0.0002772653564247259, "loss": 0.0353, "step": 14020 }, { "epoch": 0.15, "learning_rate": 0.000277249140559123, "loss": 0.0449, "step": 14030 }, { "epoch": 0.15, "learning_rate": 0.00027723292469352014, "loss": 0.0301, "step": 14040 }, { "epoch": 0.15, "learning_rate": 0.0002772167088279172, "loss": 0.0349, "step": 14050 }, { "epoch": 0.15, "learning_rate": 0.00027720049296231427, "loss": 0.0326, "step": 14060 }, { "epoch": 0.15, "learning_rate": 0.0002771842770967114, "loss": 0.038, "step": 14070 }, { "epoch": 0.15, "learning_rate": 0.0002771680612311085, "loss": 0.0362, "step": 14080 }, { "epoch": 0.15, "learning_rate": 0.0002771518453655056, "loss": 0.0422, "step": 14090 }, { "epoch": 0.15, "learning_rate": 0.0002771356294999027, "loss": 0.0372, "step": 14100 }, { "epoch": 0.15, "learning_rate": 0.00027711941363429976, "loss": 0.0312, "step": 14110 }, { "epoch": 0.15, "learning_rate": 0.0002771031977686969, "loss": 0.0353, "step": 14120 }, { "epoch": 0.15, "learning_rate": 0.000277086981903094, "loss": 0.0319, "step": 14130 }, { "epoch": 0.15, "learning_rate": 0.00027707076603749106, "loss": 0.0296, "step": 14140 }, { "epoch": 0.15, "learning_rate": 0.00027705455017188813, "loss": 0.0347, "step": 14150 }, { "epoch": 0.15, "learning_rate": 0.00027703833430628525, "loss": 0.0341, "step": 14160 }, { "epoch": 0.15, "learning_rate": 0.00027702211844068237, "loss": 0.0296, "step": 14170 }, { "epoch": 0.15, "learning_rate": 0.00027700590257507944, "loss": 0.0322, "step": 14180 }, { "epoch": 0.15, "learning_rate": 0.0002769896867094765, "loss": 0.0292, "step": 14190 }, { "epoch": 0.15, "learning_rate": 0.0002769734708438736, "loss": 0.0294, "step": 14200 }, { "epoch": 0.15, "learning_rate": 0.00027695725497827074, "loss": 0.0348, "step": 14210 }, { "epoch": 0.15, "learning_rate": 0.0002769410391126678, "loss": 0.032, "step": 14220 }, { "epoch": 0.15, "learning_rate": 0.00027692482324706487, "loss": 0.0336, "step": 14230 }, { "epoch": 0.15, "learning_rate": 0.000276908607381462, "loss": 0.0353, "step": 14240 }, { "epoch": 0.15, "learning_rate": 0.0002768923915158591, "loss": 0.0341, "step": 14250 }, { "epoch": 0.15, "learning_rate": 0.0002768761756502562, "loss": 0.0464, "step": 14260 }, { "epoch": 0.15, "learning_rate": 0.0002768599597846533, "loss": 0.0359, "step": 14270 }, { "epoch": 0.15, "learning_rate": 0.00027684374391905036, "loss": 0.0613, "step": 14280 }, { "epoch": 0.15, "learning_rate": 0.0002768275280534475, "loss": 0.0445, "step": 14290 }, { "epoch": 0.15, "learning_rate": 0.00027681131218784455, "loss": 0.0389, "step": 14300 }, { "epoch": 0.15, "learning_rate": 0.00027679509632224167, "loss": 0.0336, "step": 14310 }, { "epoch": 0.15, "learning_rate": 0.00027677888045663873, "loss": 0.0661, "step": 14320 }, { "epoch": 0.15, "learning_rate": 0.00027676266459103585, "loss": 0.0439, "step": 14330 }, { "epoch": 0.16, "learning_rate": 0.0002767464487254329, "loss": 0.0377, "step": 14340 }, { "epoch": 0.16, "learning_rate": 0.00027673023285983004, "loss": 0.0317, "step": 14350 }, { "epoch": 0.16, "learning_rate": 0.0002767140169942271, "loss": 0.032, "step": 14360 }, { "epoch": 0.16, "learning_rate": 0.0002766978011286242, "loss": 0.0305, "step": 14370 }, { "epoch": 0.16, "learning_rate": 0.0002766815852630213, "loss": 0.038, "step": 14380 }, { "epoch": 0.16, "learning_rate": 0.0002766653693974184, "loss": 0.0357, "step": 14390 }, { "epoch": 0.16, "learning_rate": 0.00027664915353181553, "loss": 0.0334, "step": 14400 }, { "epoch": 0.16, "learning_rate": 0.0002766329376662126, "loss": 0.0338, "step": 14410 }, { "epoch": 0.16, "learning_rate": 0.0002766167218006097, "loss": 0.0379, "step": 14420 }, { "epoch": 0.16, "learning_rate": 0.0002766005059350068, "loss": 0.035, "step": 14430 }, { "epoch": 0.16, "learning_rate": 0.0002765842900694039, "loss": 0.0392, "step": 14440 }, { "epoch": 0.16, "learning_rate": 0.00027656807420380097, "loss": 0.0302, "step": 14450 }, { "epoch": 0.16, "learning_rate": 0.0002765518583381981, "loss": 0.035, "step": 14460 }, { "epoch": 0.16, "learning_rate": 0.00027653564247259515, "loss": 0.037, "step": 14470 }, { "epoch": 0.16, "learning_rate": 0.00027651942660699227, "loss": 0.0522, "step": 14480 }, { "epoch": 0.16, "learning_rate": 0.00027650321074138934, "loss": 0.0406, "step": 14490 }, { "epoch": 0.16, "learning_rate": 0.00027648699487578646, "loss": 0.0317, "step": 14500 }, { "epoch": 0.16, "learning_rate": 0.0002764707790101835, "loss": 0.0339, "step": 14510 }, { "epoch": 0.16, "learning_rate": 0.00027645456314458064, "loss": 0.0346, "step": 14520 }, { "epoch": 0.16, "learning_rate": 0.0002764383472789777, "loss": 0.0313, "step": 14530 }, { "epoch": 0.16, "learning_rate": 0.00027642213141337483, "loss": 0.0263, "step": 14540 }, { "epoch": 0.16, "learning_rate": 0.0002764059155477719, "loss": 0.0335, "step": 14550 }, { "epoch": 0.16, "learning_rate": 0.000276389699682169, "loss": 0.0329, "step": 14560 }, { "epoch": 0.16, "learning_rate": 0.00027637348381656613, "loss": 0.0335, "step": 14570 }, { "epoch": 0.16, "learning_rate": 0.0002763572679509632, "loss": 0.0306, "step": 14580 }, { "epoch": 0.16, "learning_rate": 0.00027634105208536027, "loss": 0.0375, "step": 14590 }, { "epoch": 0.16, "learning_rate": 0.0002763248362197574, "loss": 0.0532, "step": 14600 }, { "epoch": 0.16, "learning_rate": 0.0002763086203541545, "loss": 0.0337, "step": 14610 }, { "epoch": 0.16, "learning_rate": 0.00027629240448855157, "loss": 0.0334, "step": 14620 }, { "epoch": 0.16, "learning_rate": 0.00027627618862294864, "loss": 0.0396, "step": 14630 }, { "epoch": 0.16, "learning_rate": 0.00027625997275734576, "loss": 0.0291, "step": 14640 }, { "epoch": 0.16, "learning_rate": 0.0002762437568917429, "loss": 0.0305, "step": 14650 }, { "epoch": 0.16, "learning_rate": 0.00027622754102613994, "loss": 0.0677, "step": 14660 }, { "epoch": 0.16, "learning_rate": 0.000276211325160537, "loss": 0.0329, "step": 14670 }, { "epoch": 0.16, "learning_rate": 0.0002761951092949341, "loss": 0.0365, "step": 14680 }, { "epoch": 0.16, "learning_rate": 0.00027617889342933125, "loss": 0.0316, "step": 14690 }, { "epoch": 0.16, "learning_rate": 0.00027616267756372837, "loss": 0.0329, "step": 14700 }, { "epoch": 0.16, "learning_rate": 0.00027614646169812543, "loss": 0.0299, "step": 14710 }, { "epoch": 0.16, "learning_rate": 0.0002761302458325225, "loss": 0.0351, "step": 14720 }, { "epoch": 0.16, "learning_rate": 0.0002761140299669196, "loss": 0.0327, "step": 14730 }, { "epoch": 0.16, "learning_rate": 0.00027609781410131674, "loss": 0.0282, "step": 14740 }, { "epoch": 0.16, "learning_rate": 0.0002760815982357138, "loss": 0.0343, "step": 14750 }, { "epoch": 0.16, "learning_rate": 0.00027606538237011087, "loss": 0.0454, "step": 14760 }, { "epoch": 0.16, "learning_rate": 0.000276049166504508, "loss": 0.0337, "step": 14770 }, { "epoch": 0.16, "learning_rate": 0.0002760329506389051, "loss": 0.0325, "step": 14780 }, { "epoch": 0.16, "learning_rate": 0.0002760167347733022, "loss": 0.0344, "step": 14790 }, { "epoch": 0.16, "learning_rate": 0.00027600051890769924, "loss": 0.0291, "step": 14800 }, { "epoch": 0.16, "learning_rate": 0.00027598430304209636, "loss": 0.0326, "step": 14810 }, { "epoch": 0.16, "learning_rate": 0.0002759680871764935, "loss": 0.0306, "step": 14820 }, { "epoch": 0.16, "learning_rate": 0.00027595187131089055, "loss": 0.0312, "step": 14830 }, { "epoch": 0.16, "learning_rate": 0.00027593565544528766, "loss": 0.0325, "step": 14840 }, { "epoch": 0.16, "learning_rate": 0.00027591943957968473, "loss": 0.0378, "step": 14850 }, { "epoch": 0.16, "learning_rate": 0.00027590322371408185, "loss": 0.0327, "step": 14860 }, { "epoch": 0.16, "learning_rate": 0.0002758870078484789, "loss": 0.0366, "step": 14870 }, { "epoch": 0.16, "learning_rate": 0.00027587079198287604, "loss": 0.0323, "step": 14880 }, { "epoch": 0.16, "learning_rate": 0.0002758545761172731, "loss": 0.0324, "step": 14890 }, { "epoch": 0.16, "learning_rate": 0.0002758383602516702, "loss": 0.0303, "step": 14900 }, { "epoch": 0.16, "learning_rate": 0.0002758221443860673, "loss": 0.0319, "step": 14910 }, { "epoch": 0.16, "learning_rate": 0.0002758059285204644, "loss": 0.029, "step": 14920 }, { "epoch": 0.16, "learning_rate": 0.00027578971265486147, "loss": 0.0378, "step": 14930 }, { "epoch": 0.16, "learning_rate": 0.0002757734967892586, "loss": 0.0318, "step": 14940 }, { "epoch": 0.16, "learning_rate": 0.00027575728092365566, "loss": 0.0315, "step": 14950 }, { "epoch": 0.16, "learning_rate": 0.0002757410650580528, "loss": 0.0289, "step": 14960 }, { "epoch": 0.16, "learning_rate": 0.00027572484919244984, "loss": 0.028, "step": 14970 }, { "epoch": 0.16, "learning_rate": 0.00027570863332684696, "loss": 0.0338, "step": 14980 }, { "epoch": 0.16, "learning_rate": 0.00027569241746124403, "loss": 0.0344, "step": 14990 }, { "epoch": 0.16, "learning_rate": 0.00027567620159564115, "loss": 0.0265, "step": 15000 }, { "epoch": 0.16, "eval_cer": 0.9216250866431449, "eval_loss": 0.02385568805038929, "eval_runtime": 119.8391, "eval_samples_per_second": 16.689, "eval_steps_per_second": 4.172, "step": 15000 }, { "epoch": 0.16, "learning_rate": 0.00027565998573003827, "loss": 0.0339, "step": 15010 }, { "epoch": 0.16, "learning_rate": 0.00027564376986443533, "loss": 0.033, "step": 15020 }, { "epoch": 0.16, "learning_rate": 0.0002756275539988324, "loss": 0.0324, "step": 15030 }, { "epoch": 0.16, "learning_rate": 0.0002756113381332295, "loss": 0.0325, "step": 15040 }, { "epoch": 0.16, "learning_rate": 0.00027559512226762664, "loss": 0.0323, "step": 15050 }, { "epoch": 0.16, "learning_rate": 0.0002755789064020237, "loss": 0.036, "step": 15060 }, { "epoch": 0.16, "learning_rate": 0.00027556269053642077, "loss": 0.0282, "step": 15070 }, { "epoch": 0.16, "learning_rate": 0.0002755464746708179, "loss": 0.0303, "step": 15080 }, { "epoch": 0.16, "learning_rate": 0.000275530258805215, "loss": 0.0312, "step": 15090 }, { "epoch": 0.16, "learning_rate": 0.0002755140429396121, "loss": 0.0379, "step": 15100 }, { "epoch": 0.16, "learning_rate": 0.0002754978270740092, "loss": 0.0365, "step": 15110 }, { "epoch": 0.16, "learning_rate": 0.00027548161120840626, "loss": 0.0379, "step": 15120 }, { "epoch": 0.16, "learning_rate": 0.0002754653953428034, "loss": 0.0324, "step": 15130 }, { "epoch": 0.16, "learning_rate": 0.0002754491794772005, "loss": 0.0353, "step": 15140 }, { "epoch": 0.16, "learning_rate": 0.00027543296361159757, "loss": 0.0393, "step": 15150 }, { "epoch": 0.16, "learning_rate": 0.00027541674774599463, "loss": 0.0372, "step": 15160 }, { "epoch": 0.16, "learning_rate": 0.00027540053188039175, "loss": 0.0328, "step": 15170 }, { "epoch": 0.16, "learning_rate": 0.00027538431601478887, "loss": 0.0334, "step": 15180 }, { "epoch": 0.16, "learning_rate": 0.00027536810014918594, "loss": 0.0279, "step": 15190 }, { "epoch": 0.16, "learning_rate": 0.000275351884283583, "loss": 0.0302, "step": 15200 }, { "epoch": 0.16, "learning_rate": 0.0002753356684179801, "loss": 0.0296, "step": 15210 }, { "epoch": 0.16, "learning_rate": 0.00027531945255237724, "loss": 0.0283, "step": 15220 }, { "epoch": 0.16, "learning_rate": 0.0002753032366867743, "loss": 0.0309, "step": 15230 }, { "epoch": 0.16, "learning_rate": 0.0002752870208211714, "loss": 0.0319, "step": 15240 }, { "epoch": 0.16, "learning_rate": 0.0002752708049555685, "loss": 0.0311, "step": 15250 }, { "epoch": 0.16, "learning_rate": 0.0002752545890899656, "loss": 0.032, "step": 15260 }, { "epoch": 0.17, "learning_rate": 0.0002752383732243627, "loss": 0.0331, "step": 15270 }, { "epoch": 0.17, "learning_rate": 0.0002752221573587598, "loss": 0.0332, "step": 15280 }, { "epoch": 0.17, "learning_rate": 0.00027520594149315687, "loss": 0.0326, "step": 15290 }, { "epoch": 0.17, "learning_rate": 0.000275189725627554, "loss": 0.0321, "step": 15300 }, { "epoch": 0.17, "learning_rate": 0.0002751735097619511, "loss": 0.0314, "step": 15310 }, { "epoch": 0.17, "learning_rate": 0.00027515729389634817, "loss": 0.0362, "step": 15320 }, { "epoch": 0.17, "learning_rate": 0.00027514107803074524, "loss": 0.0332, "step": 15330 }, { "epoch": 0.17, "learning_rate": 0.00027512486216514236, "loss": 0.0332, "step": 15340 }, { "epoch": 0.17, "learning_rate": 0.0002751086462995395, "loss": 0.0323, "step": 15350 }, { "epoch": 0.17, "learning_rate": 0.00027509243043393654, "loss": 0.0311, "step": 15360 }, { "epoch": 0.17, "learning_rate": 0.0002750762145683336, "loss": 0.0361, "step": 15370 }, { "epoch": 0.17, "learning_rate": 0.00027505999870273073, "loss": 0.0292, "step": 15380 }, { "epoch": 0.17, "learning_rate": 0.00027504378283712785, "loss": 0.0363, "step": 15390 }, { "epoch": 0.17, "learning_rate": 0.0002750275669715249, "loss": 0.0298, "step": 15400 }, { "epoch": 0.17, "learning_rate": 0.00027501135110592203, "loss": 0.0325, "step": 15410 }, { "epoch": 0.17, "learning_rate": 0.0002749951352403191, "loss": 0.0326, "step": 15420 }, { "epoch": 0.17, "learning_rate": 0.0002749789193747162, "loss": 0.0287, "step": 15430 }, { "epoch": 0.17, "learning_rate": 0.0002749627035091133, "loss": 0.0327, "step": 15440 }, { "epoch": 0.17, "learning_rate": 0.0002749464876435104, "loss": 0.0345, "step": 15450 }, { "epoch": 0.17, "learning_rate": 0.00027493027177790747, "loss": 0.0315, "step": 15460 }, { "epoch": 0.17, "learning_rate": 0.0002749140559123046, "loss": 0.0324, "step": 15470 }, { "epoch": 0.17, "learning_rate": 0.00027489784004670165, "loss": 0.0285, "step": 15480 }, { "epoch": 0.17, "learning_rate": 0.0002748816241810988, "loss": 0.0358, "step": 15490 }, { "epoch": 0.17, "learning_rate": 0.00027486540831549584, "loss": 0.0278, "step": 15500 }, { "epoch": 0.17, "learning_rate": 0.00027484919244989296, "loss": 0.0274, "step": 15510 }, { "epoch": 0.17, "learning_rate": 0.00027483297658429, "loss": 0.0288, "step": 15520 }, { "epoch": 0.17, "learning_rate": 0.00027481676071868715, "loss": 0.0287, "step": 15530 }, { "epoch": 0.17, "learning_rate": 0.0002748005448530842, "loss": 0.0304, "step": 15540 }, { "epoch": 0.17, "learning_rate": 0.00027478432898748133, "loss": 0.0296, "step": 15550 }, { "epoch": 0.17, "learning_rate": 0.0002747681131218784, "loss": 0.0351, "step": 15560 }, { "epoch": 0.17, "learning_rate": 0.0002747518972562755, "loss": 0.0388, "step": 15570 }, { "epoch": 0.17, "learning_rate": 0.00027473568139067264, "loss": 0.0285, "step": 15580 }, { "epoch": 0.17, "learning_rate": 0.0002747194655250697, "loss": 0.0303, "step": 15590 }, { "epoch": 0.17, "learning_rate": 0.00027470324965946677, "loss": 0.034, "step": 15600 }, { "epoch": 0.17, "learning_rate": 0.0002746870337938639, "loss": 0.034, "step": 15610 }, { "epoch": 0.17, "learning_rate": 0.000274670817928261, "loss": 0.0346, "step": 15620 }, { "epoch": 0.17, "learning_rate": 0.0002746546020626581, "loss": 0.0328, "step": 15630 }, { "epoch": 0.17, "learning_rate": 0.00027463838619705514, "loss": 0.0349, "step": 15640 }, { "epoch": 0.17, "learning_rate": 0.00027462217033145226, "loss": 0.0416, "step": 15650 }, { "epoch": 0.17, "learning_rate": 0.0002746059544658494, "loss": 0.0331, "step": 15660 }, { "epoch": 0.17, "learning_rate": 0.00027458973860024644, "loss": 0.0298, "step": 15670 }, { "epoch": 0.17, "learning_rate": 0.0002745735227346435, "loss": 0.032, "step": 15680 }, { "epoch": 0.17, "learning_rate": 0.00027455730686904063, "loss": 0.0292, "step": 15690 }, { "epoch": 0.17, "learning_rate": 0.00027454109100343775, "loss": 0.0345, "step": 15700 }, { "epoch": 0.17, "learning_rate": 0.00027452487513783487, "loss": 0.0346, "step": 15710 }, { "epoch": 0.17, "learning_rate": 0.00027450865927223193, "loss": 0.0345, "step": 15720 }, { "epoch": 0.17, "learning_rate": 0.000274492443406629, "loss": 0.0314, "step": 15730 }, { "epoch": 0.17, "learning_rate": 0.0002744762275410261, "loss": 0.0317, "step": 15740 }, { "epoch": 0.17, "learning_rate": 0.00027446001167542324, "loss": 0.0286, "step": 15750 }, { "epoch": 0.17, "learning_rate": 0.0002744437958098203, "loss": 0.0296, "step": 15760 }, { "epoch": 0.17, "learning_rate": 0.00027442757994421737, "loss": 0.0315, "step": 15770 }, { "epoch": 0.17, "learning_rate": 0.0002744113640786145, "loss": 0.035, "step": 15780 }, { "epoch": 0.17, "learning_rate": 0.0002743951482130116, "loss": 0.0319, "step": 15790 }, { "epoch": 0.17, "learning_rate": 0.0002743789323474087, "loss": 0.0354, "step": 15800 }, { "epoch": 0.17, "learning_rate": 0.00027436271648180574, "loss": 0.0364, "step": 15810 }, { "epoch": 0.17, "learning_rate": 0.00027434650061620286, "loss": 0.0324, "step": 15820 }, { "epoch": 0.17, "learning_rate": 0.0002743302847506, "loss": 0.0357, "step": 15830 }, { "epoch": 0.17, "learning_rate": 0.00027431406888499705, "loss": 0.0317, "step": 15840 }, { "epoch": 0.17, "learning_rate": 0.00027429785301939417, "loss": 0.0329, "step": 15850 }, { "epoch": 0.17, "learning_rate": 0.00027428163715379123, "loss": 0.0335, "step": 15860 }, { "epoch": 0.17, "learning_rate": 0.00027426542128818835, "loss": 0.0265, "step": 15870 }, { "epoch": 0.17, "learning_rate": 0.0002742492054225855, "loss": 0.0319, "step": 15880 }, { "epoch": 0.17, "learning_rate": 0.00027423298955698254, "loss": 0.032, "step": 15890 }, { "epoch": 0.17, "learning_rate": 0.0002742167736913796, "loss": 0.0304, "step": 15900 }, { "epoch": 0.17, "learning_rate": 0.0002742005578257767, "loss": 0.0297, "step": 15910 }, { "epoch": 0.17, "learning_rate": 0.00027418434196017384, "loss": 0.031, "step": 15920 }, { "epoch": 0.17, "learning_rate": 0.0002741681260945709, "loss": 0.0281, "step": 15930 }, { "epoch": 0.17, "learning_rate": 0.000274151910228968, "loss": 0.0323, "step": 15940 }, { "epoch": 0.17, "learning_rate": 0.0002741356943633651, "loss": 0.0321, "step": 15950 }, { "epoch": 0.17, "learning_rate": 0.0002741194784977622, "loss": 0.0306, "step": 15960 }, { "epoch": 0.17, "learning_rate": 0.0002741032626321593, "loss": 0.0321, "step": 15970 }, { "epoch": 0.17, "learning_rate": 0.00027408704676655635, "loss": 0.0297, "step": 15980 }, { "epoch": 0.17, "learning_rate": 0.00027407083090095347, "loss": 0.0311, "step": 15990 }, { "epoch": 0.17, "learning_rate": 0.0002740546150353506, "loss": 0.029, "step": 16000 }, { "epoch": 0.17, "eval_cer": 0.9216103203928865, "eval_loss": 0.02347717247903347, "eval_runtime": 120.1178, "eval_samples_per_second": 16.65, "eval_steps_per_second": 4.163, "step": 16000 }, { "epoch": 0.17, "learning_rate": 0.00027403839916974765, "loss": 0.0309, "step": 16010 }, { "epoch": 0.17, "learning_rate": 0.00027402218330414477, "loss": 0.0301, "step": 16020 }, { "epoch": 0.17, "learning_rate": 0.00027400596743854184, "loss": 0.0358, "step": 16030 }, { "epoch": 0.17, "learning_rate": 0.00027398975157293896, "loss": 0.0314, "step": 16040 }, { "epoch": 0.17, "learning_rate": 0.000273973535707336, "loss": 0.03, "step": 16050 }, { "epoch": 0.17, "learning_rate": 0.00027395731984173314, "loss": 0.0341, "step": 16060 }, { "epoch": 0.17, "learning_rate": 0.0002739411039761302, "loss": 0.0302, "step": 16070 }, { "epoch": 0.17, "learning_rate": 0.00027392488811052733, "loss": 0.0337, "step": 16080 }, { "epoch": 0.17, "learning_rate": 0.0002739086722449244, "loss": 0.0294, "step": 16090 }, { "epoch": 0.17, "learning_rate": 0.0002738924563793215, "loss": 0.0294, "step": 16100 }, { "epoch": 0.17, "learning_rate": 0.0002738762405137186, "loss": 0.0283, "step": 16110 }, { "epoch": 0.17, "learning_rate": 0.0002738600246481157, "loss": 0.0338, "step": 16120 }, { "epoch": 0.17, "learning_rate": 0.00027384380878251276, "loss": 0.027, "step": 16130 }, { "epoch": 0.17, "learning_rate": 0.0002738275929169099, "loss": 0.0294, "step": 16140 }, { "epoch": 0.17, "learning_rate": 0.000273811377051307, "loss": 0.0278, "step": 16150 }, { "epoch": 0.17, "learning_rate": 0.00027379516118570407, "loss": 0.0272, "step": 16160 }, { "epoch": 0.17, "learning_rate": 0.00027377894532010114, "loss": 0.0295, "step": 16170 }, { "epoch": 0.17, "learning_rate": 0.00027376272945449826, "loss": 0.0292, "step": 16180 }, { "epoch": 0.18, "learning_rate": 0.0002737465135888954, "loss": 0.0307, "step": 16190 }, { "epoch": 0.18, "learning_rate": 0.00027373029772329244, "loss": 0.0276, "step": 16200 }, { "epoch": 0.18, "learning_rate": 0.0002737140818576895, "loss": 0.0327, "step": 16210 }, { "epoch": 0.18, "learning_rate": 0.0002736978659920866, "loss": 0.0308, "step": 16220 }, { "epoch": 0.18, "learning_rate": 0.00027368165012648375, "loss": 0.0306, "step": 16230 }, { "epoch": 0.18, "learning_rate": 0.0002736654342608808, "loss": 0.0286, "step": 16240 }, { "epoch": 0.18, "learning_rate": 0.0002736492183952779, "loss": 0.028, "step": 16250 }, { "epoch": 0.18, "learning_rate": 0.000273633002529675, "loss": 0.0331, "step": 16260 }, { "epoch": 0.18, "learning_rate": 0.0002736167866640721, "loss": 0.0309, "step": 16270 }, { "epoch": 0.18, "learning_rate": 0.0002736005707984692, "loss": 0.0292, "step": 16280 }, { "epoch": 0.18, "learning_rate": 0.0002735843549328663, "loss": 0.0277, "step": 16290 }, { "epoch": 0.18, "learning_rate": 0.00027356813906726337, "loss": 0.0296, "step": 16300 }, { "epoch": 0.18, "learning_rate": 0.0002735519232016605, "loss": 0.0283, "step": 16310 }, { "epoch": 0.18, "learning_rate": 0.0002735357073360576, "loss": 0.0332, "step": 16320 }, { "epoch": 0.18, "learning_rate": 0.0002735194914704547, "loss": 0.0277, "step": 16330 }, { "epoch": 0.18, "learning_rate": 0.00027350327560485174, "loss": 0.0307, "step": 16340 }, { "epoch": 0.18, "learning_rate": 0.00027348705973924886, "loss": 0.0331, "step": 16350 }, { "epoch": 0.18, "learning_rate": 0.000273470843873646, "loss": 0.0316, "step": 16360 }, { "epoch": 0.18, "learning_rate": 0.00027345462800804304, "loss": 0.0305, "step": 16370 }, { "epoch": 0.18, "learning_rate": 0.0002734384121424401, "loss": 0.0228, "step": 16380 }, { "epoch": 0.18, "learning_rate": 0.00027342219627683723, "loss": 0.0338, "step": 16390 }, { "epoch": 0.18, "learning_rate": 0.00027340598041123435, "loss": 0.0278, "step": 16400 }, { "epoch": 0.18, "learning_rate": 0.0002733897645456314, "loss": 0.0294, "step": 16410 }, { "epoch": 0.18, "learning_rate": 0.00027337354868002854, "loss": 0.0287, "step": 16420 }, { "epoch": 0.18, "learning_rate": 0.0002733573328144256, "loss": 0.0274, "step": 16430 }, { "epoch": 0.18, "learning_rate": 0.0002733411169488227, "loss": 0.0263, "step": 16440 }, { "epoch": 0.18, "learning_rate": 0.0002733249010832198, "loss": 0.0297, "step": 16450 }, { "epoch": 0.18, "learning_rate": 0.0002733086852176169, "loss": 0.0244, "step": 16460 }, { "epoch": 0.18, "learning_rate": 0.00027329246935201397, "loss": 0.0282, "step": 16470 }, { "epoch": 0.18, "learning_rate": 0.0002732762534864111, "loss": 0.0302, "step": 16480 }, { "epoch": 0.18, "learning_rate": 0.00027326003762080816, "loss": 0.0302, "step": 16490 }, { "epoch": 0.18, "learning_rate": 0.0002732438217552053, "loss": 0.0384, "step": 16500 }, { "epoch": 0.18, "learning_rate": 0.00027322760588960234, "loss": 0.0252, "step": 16510 }, { "epoch": 0.18, "learning_rate": 0.00027321139002399946, "loss": 0.0272, "step": 16520 }, { "epoch": 0.18, "learning_rate": 0.00027319517415839653, "loss": 0.0322, "step": 16530 }, { "epoch": 0.18, "learning_rate": 0.00027317895829279365, "loss": 0.0287, "step": 16540 }, { "epoch": 0.18, "learning_rate": 0.0002731627424271907, "loss": 0.0313, "step": 16550 }, { "epoch": 0.18, "learning_rate": 0.00027314652656158783, "loss": 0.0275, "step": 16560 }, { "epoch": 0.18, "learning_rate": 0.00027313031069598495, "loss": 0.0295, "step": 16570 }, { "epoch": 0.18, "learning_rate": 0.000273114094830382, "loss": 0.0264, "step": 16580 }, { "epoch": 0.18, "learning_rate": 0.00027309787896477914, "loss": 0.0277, "step": 16590 }, { "epoch": 0.18, "learning_rate": 0.0002730816630991762, "loss": 0.0264, "step": 16600 }, { "epoch": 0.18, "learning_rate": 0.0002730654472335733, "loss": 0.0329, "step": 16610 }, { "epoch": 0.18, "learning_rate": 0.0002730492313679704, "loss": 0.031, "step": 16620 }, { "epoch": 0.18, "learning_rate": 0.0002730330155023675, "loss": 0.0309, "step": 16630 }, { "epoch": 0.18, "learning_rate": 0.0002730167996367646, "loss": 0.0347, "step": 16640 }, { "epoch": 0.18, "learning_rate": 0.0002730005837711617, "loss": 0.0328, "step": 16650 }, { "epoch": 0.18, "learning_rate": 0.00027298436790555876, "loss": 0.0301, "step": 16660 }, { "epoch": 0.18, "learning_rate": 0.0002729681520399559, "loss": 0.0338, "step": 16670 }, { "epoch": 0.18, "learning_rate": 0.00027295193617435295, "loss": 0.0308, "step": 16680 }, { "epoch": 0.18, "learning_rate": 0.00027293572030875007, "loss": 0.0322, "step": 16690 }, { "epoch": 0.18, "learning_rate": 0.00027291950444314713, "loss": 0.0375, "step": 16700 }, { "epoch": 0.18, "learning_rate": 0.00027290328857754425, "loss": 0.0334, "step": 16710 }, { "epoch": 0.18, "learning_rate": 0.00027288707271194137, "loss": 0.0394, "step": 16720 }, { "epoch": 0.18, "learning_rate": 0.00027287085684633844, "loss": 0.0323, "step": 16730 }, { "epoch": 0.18, "learning_rate": 0.0002728546409807355, "loss": 0.0281, "step": 16740 }, { "epoch": 0.18, "learning_rate": 0.0002728384251151326, "loss": 0.036, "step": 16750 }, { "epoch": 0.18, "learning_rate": 0.00027282220924952974, "loss": 0.033, "step": 16760 }, { "epoch": 0.18, "learning_rate": 0.0002728059933839268, "loss": 0.0298, "step": 16770 }, { "epoch": 0.18, "learning_rate": 0.0002727897775183239, "loss": 0.0264, "step": 16780 }, { "epoch": 0.18, "learning_rate": 0.000272773561652721, "loss": 0.0288, "step": 16790 }, { "epoch": 0.18, "learning_rate": 0.0002727573457871181, "loss": 0.034, "step": 16800 }, { "epoch": 0.18, "learning_rate": 0.0002727411299215152, "loss": 0.0326, "step": 16810 }, { "epoch": 0.18, "learning_rate": 0.00027272491405591225, "loss": 0.0315, "step": 16820 }, { "epoch": 0.18, "learning_rate": 0.00027270869819030936, "loss": 0.0299, "step": 16830 }, { "epoch": 0.18, "learning_rate": 0.0002726924823247065, "loss": 0.0281, "step": 16840 }, { "epoch": 0.18, "learning_rate": 0.00027267626645910355, "loss": 0.0285, "step": 16850 }, { "epoch": 0.18, "learning_rate": 0.00027266005059350067, "loss": 0.0273, "step": 16860 }, { "epoch": 0.18, "learning_rate": 0.00027264383472789774, "loss": 0.0305, "step": 16870 }, { "epoch": 0.18, "learning_rate": 0.00027262761886229486, "loss": 0.0282, "step": 16880 }, { "epoch": 0.18, "learning_rate": 0.000272611402996692, "loss": 0.0279, "step": 16890 }, { "epoch": 0.18, "learning_rate": 0.00027259518713108904, "loss": 0.0337, "step": 16900 }, { "epoch": 0.18, "learning_rate": 0.0002725789712654861, "loss": 0.0309, "step": 16910 }, { "epoch": 0.18, "learning_rate": 0.0002725627553998832, "loss": 0.0318, "step": 16920 }, { "epoch": 0.18, "learning_rate": 0.00027254653953428035, "loss": 0.0355, "step": 16930 }, { "epoch": 0.18, "learning_rate": 0.0002725303236686774, "loss": 0.0271, "step": 16940 }, { "epoch": 0.18, "learning_rate": 0.0002725141078030745, "loss": 0.0278, "step": 16950 }, { "epoch": 0.18, "learning_rate": 0.0002724978919374716, "loss": 0.0326, "step": 16960 }, { "epoch": 0.18, "learning_rate": 0.0002724816760718687, "loss": 0.0257, "step": 16970 }, { "epoch": 0.18, "learning_rate": 0.0002724654602062658, "loss": 0.0303, "step": 16980 }, { "epoch": 0.18, "learning_rate": 0.00027244924434066285, "loss": 0.0271, "step": 16990 }, { "epoch": 0.18, "learning_rate": 0.00027243302847505997, "loss": 0.0295, "step": 17000 }, { "epoch": 0.18, "eval_cer": 0.9216494075259235, "eval_loss": 0.021790610626339912, "eval_runtime": 120.0679, "eval_samples_per_second": 16.657, "eval_steps_per_second": 4.164, "step": 17000 }, { "epoch": 0.18, "learning_rate": 0.0002724168126094571, "loss": 0.0334, "step": 17010 }, { "epoch": 0.18, "learning_rate": 0.00027240059674385415, "loss": 0.0319, "step": 17020 }, { "epoch": 0.18, "learning_rate": 0.0002723843808782513, "loss": 0.0292, "step": 17030 }, { "epoch": 0.18, "learning_rate": 0.00027236816501264834, "loss": 0.0341, "step": 17040 }, { "epoch": 0.18, "learning_rate": 0.00027235194914704546, "loss": 0.0303, "step": 17050 }, { "epoch": 0.18, "learning_rate": 0.0002723357332814425, "loss": 0.0326, "step": 17060 }, { "epoch": 0.18, "learning_rate": 0.00027231951741583964, "loss": 0.0292, "step": 17070 }, { "epoch": 0.18, "learning_rate": 0.0002723033015502367, "loss": 0.0256, "step": 17080 }, { "epoch": 0.18, "learning_rate": 0.00027228708568463383, "loss": 0.0246, "step": 17090 }, { "epoch": 0.18, "learning_rate": 0.0002722708698190309, "loss": 0.0276, "step": 17100 }, { "epoch": 0.18, "learning_rate": 0.000272254653953428, "loss": 0.0272, "step": 17110 }, { "epoch": 0.19, "learning_rate": 0.0002722384380878251, "loss": 0.0291, "step": 17120 }, { "epoch": 0.19, "learning_rate": 0.0002722222222222222, "loss": 0.0249, "step": 17130 }, { "epoch": 0.19, "learning_rate": 0.00027220600635661927, "loss": 0.0268, "step": 17140 }, { "epoch": 0.19, "learning_rate": 0.0002721897904910164, "loss": 0.0273, "step": 17150 }, { "epoch": 0.19, "learning_rate": 0.0002721735746254135, "loss": 0.029, "step": 17160 }, { "epoch": 0.19, "learning_rate": 0.00027215735875981057, "loss": 0.0338, "step": 17170 }, { "epoch": 0.19, "learning_rate": 0.00027214114289420764, "loss": 0.0339, "step": 17180 }, { "epoch": 0.19, "learning_rate": 0.00027212492702860476, "loss": 0.032, "step": 17190 }, { "epoch": 0.19, "learning_rate": 0.0002721087111630019, "loss": 0.0319, "step": 17200 }, { "epoch": 0.19, "learning_rate": 0.00027209249529739894, "loss": 0.0308, "step": 17210 }, { "epoch": 0.19, "learning_rate": 0.000272076279431796, "loss": 0.0342, "step": 17220 }, { "epoch": 0.19, "learning_rate": 0.00027206006356619313, "loss": 0.0278, "step": 17230 }, { "epoch": 0.19, "learning_rate": 0.00027204384770059025, "loss": 0.031, "step": 17240 }, { "epoch": 0.19, "learning_rate": 0.0002720276318349873, "loss": 0.0281, "step": 17250 }, { "epoch": 0.19, "learning_rate": 0.0002720114159693844, "loss": 0.0314, "step": 17260 }, { "epoch": 0.19, "learning_rate": 0.0002719952001037815, "loss": 0.0278, "step": 17270 }, { "epoch": 0.19, "learning_rate": 0.0002719789842381786, "loss": 0.0343, "step": 17280 }, { "epoch": 0.19, "learning_rate": 0.0002719627683725757, "loss": 0.0292, "step": 17290 }, { "epoch": 0.19, "learning_rate": 0.0002719465525069728, "loss": 0.0296, "step": 17300 }, { "epoch": 0.19, "learning_rate": 0.00027193033664136987, "loss": 0.0295, "step": 17310 }, { "epoch": 0.19, "learning_rate": 0.000271914120775767, "loss": 0.0279, "step": 17320 }, { "epoch": 0.19, "learning_rate": 0.0002718979049101641, "loss": 0.0334, "step": 17330 }, { "epoch": 0.19, "learning_rate": 0.0002718816890445612, "loss": 0.0357, "step": 17340 }, { "epoch": 0.19, "learning_rate": 0.00027186547317895824, "loss": 0.0301, "step": 17350 }, { "epoch": 0.19, "learning_rate": 0.00027184925731335536, "loss": 0.0285, "step": 17360 }, { "epoch": 0.19, "learning_rate": 0.0002718330414477525, "loss": 0.0282, "step": 17370 }, { "epoch": 0.19, "learning_rate": 0.00027181682558214955, "loss": 0.0299, "step": 17380 }, { "epoch": 0.19, "learning_rate": 0.0002718006097165466, "loss": 0.0262, "step": 17390 }, { "epoch": 0.19, "learning_rate": 0.00027178439385094373, "loss": 0.0243, "step": 17400 }, { "epoch": 0.19, "learning_rate": 0.00027176817798534085, "loss": 0.0284, "step": 17410 }, { "epoch": 0.19, "learning_rate": 0.0002717519621197379, "loss": 0.0294, "step": 17420 }, { "epoch": 0.19, "learning_rate": 0.00027173574625413504, "loss": 0.0262, "step": 17430 }, { "epoch": 0.19, "learning_rate": 0.0002717195303885321, "loss": 0.0241, "step": 17440 }, { "epoch": 0.19, "learning_rate": 0.0002717033145229292, "loss": 0.0274, "step": 17450 }, { "epoch": 0.19, "learning_rate": 0.00027168709865732634, "loss": 0.034, "step": 17460 }, { "epoch": 0.19, "learning_rate": 0.0002716708827917234, "loss": 0.0303, "step": 17470 }, { "epoch": 0.19, "learning_rate": 0.0002716546669261205, "loss": 0.0311, "step": 17480 }, { "epoch": 0.19, "learning_rate": 0.0002716384510605176, "loss": 0.0303, "step": 17490 }, { "epoch": 0.19, "learning_rate": 0.0002716222351949147, "loss": 0.0298, "step": 17500 }, { "epoch": 0.19, "learning_rate": 0.0002716060193293118, "loss": 0.0251, "step": 17510 }, { "epoch": 0.19, "learning_rate": 0.00027158980346370885, "loss": 0.0316, "step": 17520 }, { "epoch": 0.19, "learning_rate": 0.00027157358759810597, "loss": 0.0299, "step": 17530 }, { "epoch": 0.19, "learning_rate": 0.0002715573717325031, "loss": 0.0294, "step": 17540 }, { "epoch": 0.19, "learning_rate": 0.00027154115586690015, "loss": 0.0302, "step": 17550 }, { "epoch": 0.19, "learning_rate": 0.0002715249400012972, "loss": 0.0296, "step": 17560 }, { "epoch": 0.19, "learning_rate": 0.00027150872413569434, "loss": 0.0295, "step": 17570 }, { "epoch": 0.19, "learning_rate": 0.00027149250827009146, "loss": 0.0317, "step": 17580 }, { "epoch": 0.19, "learning_rate": 0.0002714762924044885, "loss": 0.0344, "step": 17590 }, { "epoch": 0.19, "learning_rate": 0.00027146007653888564, "loss": 0.0359, "step": 17600 }, { "epoch": 0.19, "learning_rate": 0.0002714438606732827, "loss": 0.0316, "step": 17610 }, { "epoch": 0.19, "learning_rate": 0.00027142764480767983, "loss": 0.0295, "step": 17620 }, { "epoch": 0.19, "learning_rate": 0.0002714114289420769, "loss": 0.0304, "step": 17630 }, { "epoch": 0.19, "learning_rate": 0.000271395213076474, "loss": 0.0268, "step": 17640 }, { "epoch": 0.19, "learning_rate": 0.0002713789972108711, "loss": 0.0254, "step": 17650 }, { "epoch": 0.19, "learning_rate": 0.0002713627813452682, "loss": 0.0326, "step": 17660 }, { "epoch": 0.19, "learning_rate": 0.00027134656547966526, "loss": 0.0259, "step": 17670 }, { "epoch": 0.19, "learning_rate": 0.0002713303496140624, "loss": 0.025, "step": 17680 }, { "epoch": 0.19, "learning_rate": 0.00027131413374845945, "loss": 0.0314, "step": 17690 }, { "epoch": 0.19, "learning_rate": 0.00027129791788285657, "loss": 0.0261, "step": 17700 }, { "epoch": 0.19, "learning_rate": 0.00027128170201725363, "loss": 0.0258, "step": 17710 }, { "epoch": 0.19, "learning_rate": 0.00027126548615165075, "loss": 0.0327, "step": 17720 }, { "epoch": 0.19, "learning_rate": 0.0002712492702860479, "loss": 0.033, "step": 17730 }, { "epoch": 0.19, "learning_rate": 0.00027123305442044494, "loss": 0.0284, "step": 17740 }, { "epoch": 0.19, "learning_rate": 0.000271216838554842, "loss": 0.0336, "step": 17750 }, { "epoch": 0.19, "learning_rate": 0.0002712006226892391, "loss": 0.0324, "step": 17760 }, { "epoch": 0.19, "learning_rate": 0.00027118440682363625, "loss": 0.0343, "step": 17770 }, { "epoch": 0.19, "learning_rate": 0.0002711681909580333, "loss": 0.0284, "step": 17780 }, { "epoch": 0.19, "learning_rate": 0.0002711519750924304, "loss": 0.0307, "step": 17790 }, { "epoch": 0.19, "learning_rate": 0.0002711357592268275, "loss": 0.0303, "step": 17800 }, { "epoch": 0.19, "learning_rate": 0.0002711195433612246, "loss": 0.0314, "step": 17810 }, { "epoch": 0.19, "learning_rate": 0.0002711033274956217, "loss": 0.0289, "step": 17820 }, { "epoch": 0.19, "learning_rate": 0.00027108711163001875, "loss": 0.031, "step": 17830 }, { "epoch": 0.19, "learning_rate": 0.00027107089576441587, "loss": 0.0281, "step": 17840 }, { "epoch": 0.19, "learning_rate": 0.000271054679898813, "loss": 0.0289, "step": 17850 }, { "epoch": 0.19, "learning_rate": 0.00027103846403321005, "loss": 0.0322, "step": 17860 }, { "epoch": 0.19, "learning_rate": 0.00027102224816760717, "loss": 0.0311, "step": 17870 }, { "epoch": 0.19, "learning_rate": 0.00027100603230200424, "loss": 0.0267, "step": 17880 }, { "epoch": 0.19, "learning_rate": 0.00027098981643640136, "loss": 0.0296, "step": 17890 }, { "epoch": 0.19, "learning_rate": 0.0002709736005707985, "loss": 0.0268, "step": 17900 }, { "epoch": 0.19, "learning_rate": 0.00027095738470519554, "loss": 0.0301, "step": 17910 }, { "epoch": 0.19, "learning_rate": 0.0002709411688395926, "loss": 0.0321, "step": 17920 }, { "epoch": 0.19, "learning_rate": 0.00027092495297398973, "loss": 0.0308, "step": 17930 }, { "epoch": 0.19, "learning_rate": 0.00027090873710838685, "loss": 0.0323, "step": 17940 }, { "epoch": 0.19, "learning_rate": 0.0002708925212427839, "loss": 0.0281, "step": 17950 }, { "epoch": 0.19, "learning_rate": 0.000270876305377181, "loss": 0.0328, "step": 17960 }, { "epoch": 0.19, "learning_rate": 0.0002708600895115781, "loss": 0.0306, "step": 17970 }, { "epoch": 0.19, "learning_rate": 0.0002708438736459752, "loss": 0.0327, "step": 17980 }, { "epoch": 0.19, "learning_rate": 0.0002708276577803723, "loss": 0.0224, "step": 17990 }, { "epoch": 0.19, "learning_rate": 0.00027081144191476935, "loss": 0.0262, "step": 18000 }, { "epoch": 0.19, "eval_cer": 0.921588605318977, "eval_loss": 0.021395886316895485, "eval_runtime": 120.389, "eval_samples_per_second": 16.613, "eval_steps_per_second": 4.153, "step": 18000 }, { "epoch": 0.19, "learning_rate": 0.00027079522604916647, "loss": 0.0273, "step": 18010 }, { "epoch": 0.19, "learning_rate": 0.0002707790101835636, "loss": 0.0335, "step": 18020 }, { "epoch": 0.19, "learning_rate": 0.0002707627943179607, "loss": 0.0313, "step": 18030 }, { "epoch": 0.2, "learning_rate": 0.0002707465784523578, "loss": 0.0303, "step": 18040 }, { "epoch": 0.2, "learning_rate": 0.00027073036258675484, "loss": 0.0289, "step": 18050 }, { "epoch": 0.2, "learning_rate": 0.00027071414672115196, "loss": 0.0297, "step": 18060 }, { "epoch": 0.2, "learning_rate": 0.0002706979308555491, "loss": 0.0343, "step": 18070 }, { "epoch": 0.2, "learning_rate": 0.00027068171498994615, "loss": 0.0283, "step": 18080 }, { "epoch": 0.2, "learning_rate": 0.0002706654991243432, "loss": 0.0266, "step": 18090 }, { "epoch": 0.2, "learning_rate": 0.00027064928325874033, "loss": 0.0344, "step": 18100 }, { "epoch": 0.2, "learning_rate": 0.00027063306739313745, "loss": 0.0289, "step": 18110 }, { "epoch": 0.2, "learning_rate": 0.0002706168515275345, "loss": 0.0265, "step": 18120 }, { "epoch": 0.2, "learning_rate": 0.0002706006356619316, "loss": 0.0344, "step": 18130 }, { "epoch": 0.2, "learning_rate": 0.0002705844197963287, "loss": 0.029, "step": 18140 }, { "epoch": 0.2, "learning_rate": 0.0002705682039307258, "loss": 0.0281, "step": 18150 }, { "epoch": 0.2, "learning_rate": 0.0002705519880651229, "loss": 0.026, "step": 18160 }, { "epoch": 0.2, "learning_rate": 0.00027053577219952, "loss": 0.0273, "step": 18170 }, { "epoch": 0.2, "learning_rate": 0.0002705195563339171, "loss": 0.0317, "step": 18180 }, { "epoch": 0.2, "learning_rate": 0.0002705033404683142, "loss": 0.0317, "step": 18190 }, { "epoch": 0.2, "learning_rate": 0.00027048712460271126, "loss": 0.0288, "step": 18200 }, { "epoch": 0.2, "learning_rate": 0.0002704709087371084, "loss": 0.0235, "step": 18210 }, { "epoch": 0.2, "learning_rate": 0.00027045469287150545, "loss": 0.0317, "step": 18220 }, { "epoch": 0.2, "learning_rate": 0.00027043847700590257, "loss": 0.0301, "step": 18230 }, { "epoch": 0.2, "learning_rate": 0.00027042226114029963, "loss": 0.0313, "step": 18240 }, { "epoch": 0.2, "learning_rate": 0.00027040604527469675, "loss": 0.0273, "step": 18250 }, { "epoch": 0.2, "learning_rate": 0.0002703898294090938, "loss": 0.0238, "step": 18260 }, { "epoch": 0.2, "learning_rate": 0.00027037361354349094, "loss": 0.0262, "step": 18270 }, { "epoch": 0.2, "learning_rate": 0.000270357397677888, "loss": 0.0282, "step": 18280 }, { "epoch": 0.2, "learning_rate": 0.0002703411818122851, "loss": 0.0286, "step": 18290 }, { "epoch": 0.2, "learning_rate": 0.0002703249659466822, "loss": 0.0243, "step": 18300 }, { "epoch": 0.2, "learning_rate": 0.0002703087500810793, "loss": 0.0243, "step": 18310 }, { "epoch": 0.2, "learning_rate": 0.0002702925342154764, "loss": 0.0248, "step": 18320 }, { "epoch": 0.2, "learning_rate": 0.0002702763183498735, "loss": 0.0292, "step": 18330 }, { "epoch": 0.2, "learning_rate": 0.0002702601024842706, "loss": 0.0247, "step": 18340 }, { "epoch": 0.2, "learning_rate": 0.0002702438866186677, "loss": 0.0278, "step": 18350 }, { "epoch": 0.2, "learning_rate": 0.00027022767075306474, "loss": 0.0287, "step": 18360 }, { "epoch": 0.2, "learning_rate": 0.00027021145488746186, "loss": 0.03, "step": 18370 }, { "epoch": 0.2, "learning_rate": 0.000270195239021859, "loss": 0.0285, "step": 18380 }, { "epoch": 0.2, "learning_rate": 0.00027017902315625605, "loss": 0.0234, "step": 18390 }, { "epoch": 0.2, "learning_rate": 0.0002701628072906531, "loss": 0.0266, "step": 18400 }, { "epoch": 0.2, "learning_rate": 0.00027014659142505024, "loss": 0.0294, "step": 18410 }, { "epoch": 0.2, "learning_rate": 0.00027013037555944736, "loss": 0.0313, "step": 18420 }, { "epoch": 0.2, "learning_rate": 0.0002701141596938444, "loss": 0.0285, "step": 18430 }, { "epoch": 0.2, "learning_rate": 0.00027009794382824154, "loss": 0.0252, "step": 18440 }, { "epoch": 0.2, "learning_rate": 0.0002700817279626386, "loss": 0.0297, "step": 18450 }, { "epoch": 0.2, "learning_rate": 0.0002700655120970357, "loss": 0.028, "step": 18460 }, { "epoch": 0.2, "learning_rate": 0.00027004929623143285, "loss": 0.0297, "step": 18470 }, { "epoch": 0.2, "learning_rate": 0.0002700330803658299, "loss": 0.0306, "step": 18480 }, { "epoch": 0.2, "learning_rate": 0.000270016864500227, "loss": 0.0242, "step": 18490 }, { "epoch": 0.2, "learning_rate": 0.0002700006486346241, "loss": 0.0296, "step": 18500 }, { "epoch": 0.2, "learning_rate": 0.0002699844327690212, "loss": 0.026, "step": 18510 }, { "epoch": 0.2, "learning_rate": 0.0002699682169034183, "loss": 0.0288, "step": 18520 }, { "epoch": 0.2, "learning_rate": 0.00026995200103781535, "loss": 0.0288, "step": 18530 }, { "epoch": 0.2, "learning_rate": 0.00026993578517221247, "loss": 0.0295, "step": 18540 }, { "epoch": 0.2, "learning_rate": 0.0002699195693066096, "loss": 0.0321, "step": 18550 }, { "epoch": 0.2, "learning_rate": 0.00026990335344100665, "loss": 0.0283, "step": 18560 }, { "epoch": 0.2, "learning_rate": 0.0002698871375754037, "loss": 0.0298, "step": 18570 }, { "epoch": 0.2, "learning_rate": 0.00026987092170980084, "loss": 0.0317, "step": 18580 }, { "epoch": 0.2, "learning_rate": 0.00026985470584419796, "loss": 0.0253, "step": 18590 }, { "epoch": 0.2, "learning_rate": 0.000269838489978595, "loss": 0.0339, "step": 18600 }, { "epoch": 0.2, "learning_rate": 0.00026982227411299214, "loss": 0.0248, "step": 18610 }, { "epoch": 0.2, "learning_rate": 0.0002698060582473892, "loss": 0.0303, "step": 18620 }, { "epoch": 0.2, "learning_rate": 0.00026978984238178633, "loss": 0.0263, "step": 18630 }, { "epoch": 0.2, "learning_rate": 0.0002697736265161834, "loss": 0.0587, "step": 18640 }, { "epoch": 0.2, "learning_rate": 0.0002697574106505805, "loss": 0.0643, "step": 18650 }, { "epoch": 0.2, "learning_rate": 0.0002697411947849776, "loss": 0.0374, "step": 18660 }, { "epoch": 0.2, "learning_rate": 0.0002697249789193747, "loss": 0.0332, "step": 18670 }, { "epoch": 0.2, "learning_rate": 0.00026970876305377177, "loss": 0.0342, "step": 18680 }, { "epoch": 0.2, "learning_rate": 0.0002696925471881689, "loss": 0.0264, "step": 18690 }, { "epoch": 0.2, "learning_rate": 0.00026967633132256595, "loss": 0.0283, "step": 18700 }, { "epoch": 0.2, "learning_rate": 0.00026966011545696307, "loss": 0.0265, "step": 18710 }, { "epoch": 0.2, "learning_rate": 0.0002696438995913602, "loss": 0.0361, "step": 18720 }, { "epoch": 0.2, "learning_rate": 0.00026962768372575726, "loss": 0.036, "step": 18730 }, { "epoch": 0.2, "learning_rate": 0.0002696114678601544, "loss": 0.0301, "step": 18740 }, { "epoch": 0.2, "learning_rate": 0.00026959525199455144, "loss": 0.0298, "step": 18750 }, { "epoch": 0.2, "learning_rate": 0.00026957903612894856, "loss": 0.0279, "step": 18760 }, { "epoch": 0.2, "learning_rate": 0.00026956282026334563, "loss": 0.0389, "step": 18770 }, { "epoch": 0.2, "learning_rate": 0.00026954660439774275, "loss": 0.0305, "step": 18780 }, { "epoch": 0.2, "learning_rate": 0.0002695303885321398, "loss": 0.0445, "step": 18790 }, { "epoch": 0.2, "learning_rate": 0.00026951417266653693, "loss": 0.0261, "step": 18800 }, { "epoch": 0.2, "learning_rate": 0.000269497956800934, "loss": 0.0324, "step": 18810 }, { "epoch": 0.2, "learning_rate": 0.0002694817409353311, "loss": 0.0281, "step": 18820 }, { "epoch": 0.2, "learning_rate": 0.0002694655250697282, "loss": 0.0305, "step": 18830 }, { "epoch": 0.2, "learning_rate": 0.0002694493092041253, "loss": 0.0272, "step": 18840 }, { "epoch": 0.2, "learning_rate": 0.00026943309333852237, "loss": 0.0339, "step": 18850 }, { "epoch": 0.2, "learning_rate": 0.0002694168774729195, "loss": 0.0312, "step": 18860 }, { "epoch": 0.2, "learning_rate": 0.00026940066160731656, "loss": 0.0403, "step": 18870 }, { "epoch": 0.2, "learning_rate": 0.0002693844457417137, "loss": 0.0301, "step": 18880 }, { "epoch": 0.2, "learning_rate": 0.00026936822987611074, "loss": 0.0408, "step": 18890 }, { "epoch": 0.2, "learning_rate": 0.00026935201401050786, "loss": 0.0542, "step": 18900 }, { "epoch": 0.2, "learning_rate": 0.000269335798144905, "loss": 0.0271, "step": 18910 }, { "epoch": 0.2, "learning_rate": 0.00026931958227930205, "loss": 0.033, "step": 18920 }, { "epoch": 0.2, "learning_rate": 0.0002693033664136991, "loss": 0.0299, "step": 18930 }, { "epoch": 0.2, "learning_rate": 0.00026928715054809623, "loss": 0.0296, "step": 18940 }, { "epoch": 0.2, "learning_rate": 0.00026927093468249335, "loss": 0.027, "step": 18950 }, { "epoch": 0.2, "learning_rate": 0.0002692547188168904, "loss": 0.0291, "step": 18960 }, { "epoch": 0.21, "learning_rate": 0.0002692385029512875, "loss": 0.0305, "step": 18970 }, { "epoch": 0.21, "learning_rate": 0.0002692222870856846, "loss": 0.0283, "step": 18980 }, { "epoch": 0.21, "learning_rate": 0.0002692060712200817, "loss": 0.0291, "step": 18990 }, { "epoch": 0.21, "learning_rate": 0.0002691898553544788, "loss": 0.0274, "step": 19000 }, { "epoch": 0.21, "eval_cer": 0.9216233494372321, "eval_loss": 0.022243507206439972, "eval_runtime": 120.016, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 19000 }, { "epoch": 0.21, "learning_rate": 0.00026917363948887585, "loss": 0.0291, "step": 19010 }, { "epoch": 0.21, "learning_rate": 0.000269157423623273, "loss": 0.0257, "step": 19020 }, { "epoch": 0.21, "learning_rate": 0.0002691412077576701, "loss": 0.0274, "step": 19030 }, { "epoch": 0.21, "learning_rate": 0.0002691249918920672, "loss": 0.0343, "step": 19040 }, { "epoch": 0.21, "learning_rate": 0.0002691087760264643, "loss": 0.03, "step": 19050 }, { "epoch": 0.21, "learning_rate": 0.00026909256016086134, "loss": 0.0305, "step": 19060 }, { "epoch": 0.21, "learning_rate": 0.00026907634429525846, "loss": 0.0292, "step": 19070 }, { "epoch": 0.21, "learning_rate": 0.0002690601284296556, "loss": 0.0297, "step": 19080 }, { "epoch": 0.21, "learning_rate": 0.00026904391256405265, "loss": 0.031, "step": 19090 }, { "epoch": 0.21, "learning_rate": 0.0002690276966984497, "loss": 0.0278, "step": 19100 }, { "epoch": 0.21, "learning_rate": 0.00026901148083284684, "loss": 0.031, "step": 19110 }, { "epoch": 0.21, "learning_rate": 0.00026899526496724396, "loss": 0.0353, "step": 19120 }, { "epoch": 0.21, "learning_rate": 0.000268979049101641, "loss": 0.0246, "step": 19130 }, { "epoch": 0.21, "learning_rate": 0.0002689628332360381, "loss": 0.0328, "step": 19140 }, { "epoch": 0.21, "learning_rate": 0.0002689466173704352, "loss": 0.0299, "step": 19150 }, { "epoch": 0.21, "learning_rate": 0.0002689304015048323, "loss": 0.0296, "step": 19160 }, { "epoch": 0.21, "learning_rate": 0.0002689141856392294, "loss": 0.0277, "step": 19170 }, { "epoch": 0.21, "learning_rate": 0.0002688979697736265, "loss": 0.0293, "step": 19180 }, { "epoch": 0.21, "learning_rate": 0.0002688817539080236, "loss": 0.0296, "step": 19190 }, { "epoch": 0.21, "learning_rate": 0.0002688655380424207, "loss": 0.0283, "step": 19200 }, { "epoch": 0.21, "learning_rate": 0.00026884932217681776, "loss": 0.0287, "step": 19210 }, { "epoch": 0.21, "learning_rate": 0.0002688331063112149, "loss": 0.0256, "step": 19220 }, { "epoch": 0.21, "learning_rate": 0.00026881689044561195, "loss": 0.0254, "step": 19230 }, { "epoch": 0.21, "learning_rate": 0.00026880067458000907, "loss": 0.0301, "step": 19240 }, { "epoch": 0.21, "learning_rate": 0.00026878445871440613, "loss": 0.0235, "step": 19250 }, { "epoch": 0.21, "learning_rate": 0.00026876824284880325, "loss": 0.029, "step": 19260 }, { "epoch": 0.21, "learning_rate": 0.0002687520269832003, "loss": 0.0294, "step": 19270 }, { "epoch": 0.21, "learning_rate": 0.00026873581111759744, "loss": 0.0298, "step": 19280 }, { "epoch": 0.21, "learning_rate": 0.0002687195952519945, "loss": 0.0276, "step": 19290 }, { "epoch": 0.21, "learning_rate": 0.0002687033793863916, "loss": 0.0253, "step": 19300 }, { "epoch": 0.21, "learning_rate": 0.0002686871635207887, "loss": 0.0269, "step": 19310 }, { "epoch": 0.21, "learning_rate": 0.0002686709476551858, "loss": 0.0346, "step": 19320 }, { "epoch": 0.21, "learning_rate": 0.0002686547317895829, "loss": 0.0328, "step": 19330 }, { "epoch": 0.21, "learning_rate": 0.00026863851592398, "loss": 0.0235, "step": 19340 }, { "epoch": 0.21, "learning_rate": 0.0002686223000583771, "loss": 0.0267, "step": 19350 }, { "epoch": 0.21, "learning_rate": 0.0002686060841927742, "loss": 0.0253, "step": 19360 }, { "epoch": 0.21, "learning_rate": 0.00026858986832717125, "loss": 0.0265, "step": 19370 }, { "epoch": 0.21, "learning_rate": 0.00026857365246156837, "loss": 0.0257, "step": 19380 }, { "epoch": 0.21, "learning_rate": 0.0002685574365959655, "loss": 0.0284, "step": 19390 }, { "epoch": 0.21, "learning_rate": 0.00026854122073036255, "loss": 0.0307, "step": 19400 }, { "epoch": 0.21, "learning_rate": 0.0002685250048647596, "loss": 0.0284, "step": 19410 }, { "epoch": 0.21, "learning_rate": 0.00026850878899915674, "loss": 0.0336, "step": 19420 }, { "epoch": 0.21, "learning_rate": 0.00026849257313355386, "loss": 0.0304, "step": 19430 }, { "epoch": 0.21, "learning_rate": 0.0002684763572679509, "loss": 0.0242, "step": 19440 }, { "epoch": 0.21, "learning_rate": 0.00026846014140234804, "loss": 0.0359, "step": 19450 }, { "epoch": 0.21, "learning_rate": 0.0002684439255367451, "loss": 0.0265, "step": 19460 }, { "epoch": 0.21, "learning_rate": 0.00026842770967114223, "loss": 0.0265, "step": 19470 }, { "epoch": 0.21, "learning_rate": 0.00026841149380553935, "loss": 0.0276, "step": 19480 }, { "epoch": 0.21, "learning_rate": 0.0002683952779399364, "loss": 0.0267, "step": 19490 }, { "epoch": 0.21, "learning_rate": 0.0002683790620743335, "loss": 0.0272, "step": 19500 }, { "epoch": 0.21, "learning_rate": 0.0002683628462087306, "loss": 0.0261, "step": 19510 }, { "epoch": 0.21, "learning_rate": 0.0002683466303431277, "loss": 0.028, "step": 19520 }, { "epoch": 0.21, "learning_rate": 0.0002683304144775248, "loss": 0.0232, "step": 19530 }, { "epoch": 0.21, "learning_rate": 0.00026831419861192185, "loss": 0.0276, "step": 19540 }, { "epoch": 0.21, "learning_rate": 0.00026829798274631897, "loss": 0.0282, "step": 19550 }, { "epoch": 0.21, "learning_rate": 0.0002682817668807161, "loss": 0.0262, "step": 19560 }, { "epoch": 0.21, "learning_rate": 0.00026826555101511316, "loss": 0.0274, "step": 19570 }, { "epoch": 0.21, "learning_rate": 0.0002682493351495102, "loss": 0.028, "step": 19580 }, { "epoch": 0.21, "learning_rate": 0.00026823311928390734, "loss": 0.0279, "step": 19590 }, { "epoch": 0.21, "learning_rate": 0.00026821690341830446, "loss": 0.0284, "step": 19600 }, { "epoch": 0.21, "learning_rate": 0.0002682006875527016, "loss": 0.0255, "step": 19610 }, { "epoch": 0.21, "learning_rate": 0.00026818447168709865, "loss": 0.0294, "step": 19620 }, { "epoch": 0.21, "learning_rate": 0.0002681682558214957, "loss": 0.0328, "step": 19630 }, { "epoch": 0.21, "learning_rate": 0.00026815203995589283, "loss": 0.0333, "step": 19640 }, { "epoch": 0.21, "learning_rate": 0.00026813582409028995, "loss": 0.0305, "step": 19650 }, { "epoch": 0.21, "learning_rate": 0.000268119608224687, "loss": 0.0258, "step": 19660 }, { "epoch": 0.21, "learning_rate": 0.0002681033923590841, "loss": 0.0427, "step": 19670 }, { "epoch": 0.21, "learning_rate": 0.0002680871764934812, "loss": 0.0323, "step": 19680 }, { "epoch": 0.21, "learning_rate": 0.0002680709606278783, "loss": 0.0248, "step": 19690 }, { "epoch": 0.21, "learning_rate": 0.0002680547447622754, "loss": 0.0286, "step": 19700 }, { "epoch": 0.21, "learning_rate": 0.00026803852889667245, "loss": 0.024, "step": 19710 }, { "epoch": 0.21, "learning_rate": 0.0002680223130310696, "loss": 0.0279, "step": 19720 }, { "epoch": 0.21, "learning_rate": 0.0002680060971654667, "loss": 0.0254, "step": 19730 }, { "epoch": 0.21, "learning_rate": 0.00026798988129986376, "loss": 0.029, "step": 19740 }, { "epoch": 0.21, "learning_rate": 0.0002679736654342609, "loss": 0.0293, "step": 19750 }, { "epoch": 0.21, "learning_rate": 0.00026795744956865795, "loss": 0.0238, "step": 19760 }, { "epoch": 0.21, "learning_rate": 0.00026794123370305507, "loss": 0.0297, "step": 19770 }, { "epoch": 0.21, "learning_rate": 0.00026792501783745213, "loss": 0.0305, "step": 19780 }, { "epoch": 0.21, "learning_rate": 0.00026790880197184925, "loss": 0.0282, "step": 19790 }, { "epoch": 0.21, "learning_rate": 0.0002678925861062463, "loss": 0.0257, "step": 19800 }, { "epoch": 0.21, "learning_rate": 0.00026787637024064344, "loss": 0.0267, "step": 19810 }, { "epoch": 0.21, "learning_rate": 0.0002678601543750405, "loss": 0.0316, "step": 19820 }, { "epoch": 0.21, "learning_rate": 0.0002678439385094376, "loss": 0.0305, "step": 19830 }, { "epoch": 0.21, "learning_rate": 0.0002678277226438347, "loss": 0.0368, "step": 19840 }, { "epoch": 0.21, "learning_rate": 0.0002678115067782318, "loss": 0.0294, "step": 19850 }, { "epoch": 0.21, "learning_rate": 0.00026779529091262887, "loss": 0.0332, "step": 19860 }, { "epoch": 0.21, "learning_rate": 0.000267779075047026, "loss": 0.0253, "step": 19870 }, { "epoch": 0.21, "learning_rate": 0.00026776285918142306, "loss": 0.0275, "step": 19880 }, { "epoch": 0.22, "learning_rate": 0.0002677466433158202, "loss": 0.0289, "step": 19890 }, { "epoch": 0.22, "learning_rate": 0.00026773042745021724, "loss": 0.0245, "step": 19900 }, { "epoch": 0.22, "learning_rate": 0.00026771421158461436, "loss": 0.0255, "step": 19910 }, { "epoch": 0.22, "learning_rate": 0.0002676979957190115, "loss": 0.0305, "step": 19920 }, { "epoch": 0.22, "learning_rate": 0.00026768177985340855, "loss": 0.0281, "step": 19930 }, { "epoch": 0.22, "learning_rate": 0.0002676655639878056, "loss": 0.0294, "step": 19940 }, { "epoch": 0.22, "learning_rate": 0.00026764934812220273, "loss": 0.0317, "step": 19950 }, { "epoch": 0.22, "learning_rate": 0.00026763313225659985, "loss": 0.0255, "step": 19960 }, { "epoch": 0.22, "learning_rate": 0.0002676169163909969, "loss": 0.0508, "step": 19970 }, { "epoch": 0.22, "learning_rate": 0.000267600700525394, "loss": 0.0264, "step": 19980 }, { "epoch": 0.22, "learning_rate": 0.0002675844846597911, "loss": 0.0294, "step": 19990 }, { "epoch": 0.22, "learning_rate": 0.0002675682687941882, "loss": 0.0317, "step": 20000 }, { "epoch": 0.22, "eval_cer": 0.9216077145840174, "eval_loss": 0.02043878473341465, "eval_runtime": 120.3911, "eval_samples_per_second": 16.613, "eval_steps_per_second": 4.153, "step": 20000 }, { "epoch": 0.22, "learning_rate": 0.0002675520529285853, "loss": 0.0298, "step": 20010 }, { "epoch": 0.22, "learning_rate": 0.00026753583706298236, "loss": 0.0325, "step": 20020 }, { "epoch": 0.22, "learning_rate": 0.0002675196211973795, "loss": 0.0254, "step": 20030 }, { "epoch": 0.22, "learning_rate": 0.0002675034053317766, "loss": 0.0263, "step": 20040 }, { "epoch": 0.22, "learning_rate": 0.0002674871894661737, "loss": 0.0387, "step": 20050 }, { "epoch": 0.22, "learning_rate": 0.0002674709736005708, "loss": 0.0298, "step": 20060 }, { "epoch": 0.22, "learning_rate": 0.00026745475773496785, "loss": 0.0299, "step": 20070 }, { "epoch": 0.22, "learning_rate": 0.00026743854186936497, "loss": 0.031, "step": 20080 }, { "epoch": 0.22, "learning_rate": 0.0002674223260037621, "loss": 0.0245, "step": 20090 }, { "epoch": 0.22, "learning_rate": 0.00026740611013815915, "loss": 0.0261, "step": 20100 }, { "epoch": 0.22, "learning_rate": 0.0002673898942725562, "loss": 0.0246, "step": 20110 }, { "epoch": 0.22, "learning_rate": 0.00026737367840695334, "loss": 0.0301, "step": 20120 }, { "epoch": 0.22, "learning_rate": 0.00026735746254135046, "loss": 0.0328, "step": 20130 }, { "epoch": 0.22, "learning_rate": 0.0002673412466757475, "loss": 0.0368, "step": 20140 }, { "epoch": 0.22, "learning_rate": 0.0002673250308101446, "loss": 0.029, "step": 20150 }, { "epoch": 0.22, "learning_rate": 0.0002673088149445417, "loss": 0.0261, "step": 20160 }, { "epoch": 0.22, "learning_rate": 0.00026729259907893883, "loss": 0.0297, "step": 20170 }, { "epoch": 0.22, "learning_rate": 0.0002672763832133359, "loss": 0.0257, "step": 20180 }, { "epoch": 0.22, "learning_rate": 0.000267260167347733, "loss": 0.0292, "step": 20190 }, { "epoch": 0.22, "learning_rate": 0.0002672439514821301, "loss": 0.0261, "step": 20200 }, { "epoch": 0.22, "learning_rate": 0.0002672277356165272, "loss": 0.0288, "step": 20210 }, { "epoch": 0.22, "learning_rate": 0.0002672115197509243, "loss": 0.0341, "step": 20220 }, { "epoch": 0.22, "learning_rate": 0.0002671953038853214, "loss": 0.0311, "step": 20230 }, { "epoch": 0.22, "learning_rate": 0.00026717908801971845, "loss": 0.0314, "step": 20240 }, { "epoch": 0.22, "learning_rate": 0.00026716287215411557, "loss": 0.0449, "step": 20250 }, { "epoch": 0.22, "learning_rate": 0.0002671466562885127, "loss": 0.0258, "step": 20260 }, { "epoch": 0.22, "learning_rate": 0.00026713044042290976, "loss": 0.0386, "step": 20270 }, { "epoch": 0.22, "learning_rate": 0.0002671142245573068, "loss": 0.0281, "step": 20280 }, { "epoch": 0.22, "learning_rate": 0.00026709800869170394, "loss": 0.0306, "step": 20290 }, { "epoch": 0.22, "learning_rate": 0.00026708179282610106, "loss": 0.025, "step": 20300 }, { "epoch": 0.22, "learning_rate": 0.00026706557696049813, "loss": 0.028, "step": 20310 }, { "epoch": 0.22, "learning_rate": 0.0002670493610948952, "loss": 0.0279, "step": 20320 }, { "epoch": 0.22, "learning_rate": 0.0002670331452292923, "loss": 0.026, "step": 20330 }, { "epoch": 0.22, "learning_rate": 0.00026701692936368943, "loss": 0.0238, "step": 20340 }, { "epoch": 0.22, "learning_rate": 0.0002670007134980865, "loss": 0.0223, "step": 20350 }, { "epoch": 0.22, "learning_rate": 0.0002669844976324836, "loss": 0.0271, "step": 20360 }, { "epoch": 0.22, "learning_rate": 0.0002669682817668807, "loss": 0.0269, "step": 20370 }, { "epoch": 0.22, "learning_rate": 0.0002669520659012778, "loss": 0.0323, "step": 20380 }, { "epoch": 0.22, "learning_rate": 0.00026693585003567487, "loss": 0.0266, "step": 20390 }, { "epoch": 0.22, "learning_rate": 0.000266919634170072, "loss": 0.0281, "step": 20400 }, { "epoch": 0.22, "learning_rate": 0.00026690341830446905, "loss": 0.0246, "step": 20410 }, { "epoch": 0.22, "learning_rate": 0.0002668872024388662, "loss": 0.0298, "step": 20420 }, { "epoch": 0.22, "learning_rate": 0.00026687098657326324, "loss": 0.0241, "step": 20430 }, { "epoch": 0.22, "learning_rate": 0.00026685477070766036, "loss": 0.0393, "step": 20440 }, { "epoch": 0.22, "learning_rate": 0.0002668385548420574, "loss": 0.0351, "step": 20450 }, { "epoch": 0.22, "learning_rate": 0.00026682233897645455, "loss": 0.0343, "step": 20460 }, { "epoch": 0.22, "learning_rate": 0.0002668061231108516, "loss": 0.0337, "step": 20470 }, { "epoch": 0.22, "learning_rate": 0.00026678990724524873, "loss": 0.0297, "step": 20480 }, { "epoch": 0.22, "learning_rate": 0.00026677369137964585, "loss": 0.0314, "step": 20490 }, { "epoch": 0.22, "learning_rate": 0.0002667574755140429, "loss": 0.0264, "step": 20500 }, { "epoch": 0.22, "learning_rate": 0.00026674125964844, "loss": 0.0279, "step": 20510 }, { "epoch": 0.22, "learning_rate": 0.0002667250437828371, "loss": 0.0329, "step": 20520 }, { "epoch": 0.22, "learning_rate": 0.0002667088279172342, "loss": 0.0273, "step": 20530 }, { "epoch": 0.22, "learning_rate": 0.0002666926120516313, "loss": 0.0347, "step": 20540 }, { "epoch": 0.22, "learning_rate": 0.00026667639618602835, "loss": 0.0327, "step": 20550 }, { "epoch": 0.22, "learning_rate": 0.0002666601803204255, "loss": 0.0309, "step": 20560 }, { "epoch": 0.22, "learning_rate": 0.0002666439644548226, "loss": 0.0256, "step": 20570 }, { "epoch": 0.22, "learning_rate": 0.00026662774858921966, "loss": 0.0309, "step": 20580 }, { "epoch": 0.22, "learning_rate": 0.0002666115327236167, "loss": 0.0315, "step": 20590 }, { "epoch": 0.22, "learning_rate": 0.00026659531685801384, "loss": 0.0257, "step": 20600 }, { "epoch": 0.22, "learning_rate": 0.00026657910099241096, "loss": 0.0237, "step": 20610 }, { "epoch": 0.22, "learning_rate": 0.0002665628851268081, "loss": 0.0279, "step": 20620 }, { "epoch": 0.22, "learning_rate": 0.00026654666926120515, "loss": 0.0245, "step": 20630 }, { "epoch": 0.22, "learning_rate": 0.0002665304533956022, "loss": 0.0466, "step": 20640 }, { "epoch": 0.22, "learning_rate": 0.00026651423752999933, "loss": 0.0265, "step": 20650 }, { "epoch": 0.22, "learning_rate": 0.00026649802166439645, "loss": 0.026, "step": 20660 }, { "epoch": 0.22, "learning_rate": 0.0002664818057987935, "loss": 0.026, "step": 20670 }, { "epoch": 0.22, "learning_rate": 0.0002664655899331906, "loss": 0.0326, "step": 20680 }, { "epoch": 0.22, "learning_rate": 0.0002664493740675877, "loss": 0.0262, "step": 20690 }, { "epoch": 0.22, "learning_rate": 0.0002664331582019848, "loss": 0.0243, "step": 20700 }, { "epoch": 0.22, "learning_rate": 0.0002664169423363819, "loss": 0.0278, "step": 20710 }, { "epoch": 0.22, "learning_rate": 0.00026640072647077896, "loss": 0.0297, "step": 20720 }, { "epoch": 0.22, "learning_rate": 0.0002663845106051761, "loss": 0.0281, "step": 20730 }, { "epoch": 0.22, "learning_rate": 0.0002663682947395732, "loss": 0.0271, "step": 20740 }, { "epoch": 0.22, "learning_rate": 0.00026635207887397026, "loss": 0.0273, "step": 20750 }, { "epoch": 0.22, "learning_rate": 0.0002663358630083674, "loss": 0.0252, "step": 20760 }, { "epoch": 0.22, "learning_rate": 0.00026631964714276445, "loss": 0.0302, "step": 20770 }, { "epoch": 0.22, "learning_rate": 0.00026630343127716157, "loss": 0.0284, "step": 20780 }, { "epoch": 0.22, "learning_rate": 0.00026628721541155863, "loss": 0.0265, "step": 20790 }, { "epoch": 0.22, "learning_rate": 0.00026627099954595575, "loss": 0.0278, "step": 20800 }, { "epoch": 0.22, "learning_rate": 0.0002662547836803528, "loss": 0.0279, "step": 20810 }, { "epoch": 0.23, "learning_rate": 0.00026623856781474994, "loss": 0.0279, "step": 20820 }, { "epoch": 0.23, "learning_rate": 0.000266222351949147, "loss": 0.0246, "step": 20830 }, { "epoch": 0.23, "learning_rate": 0.0002662061360835441, "loss": 0.0272, "step": 20840 }, { "epoch": 0.23, "learning_rate": 0.0002661899202179412, "loss": 0.0249, "step": 20850 }, { "epoch": 0.23, "learning_rate": 0.0002661737043523383, "loss": 0.0272, "step": 20860 }, { "epoch": 0.23, "learning_rate": 0.00026615748848673543, "loss": 0.029, "step": 20870 }, { "epoch": 0.23, "learning_rate": 0.0002661412726211325, "loss": 0.0222, "step": 20880 }, { "epoch": 0.23, "learning_rate": 0.00026612505675552956, "loss": 0.023, "step": 20890 }, { "epoch": 0.23, "learning_rate": 0.0002661088408899267, "loss": 0.0285, "step": 20900 }, { "epoch": 0.23, "learning_rate": 0.0002660926250243238, "loss": 0.0311, "step": 20910 }, { "epoch": 0.23, "learning_rate": 0.00026607640915872087, "loss": 0.0282, "step": 20920 }, { "epoch": 0.23, "learning_rate": 0.000266060193293118, "loss": 0.0279, "step": 20930 }, { "epoch": 0.23, "learning_rate": 0.00026604397742751505, "loss": 0.0249, "step": 20940 }, { "epoch": 0.23, "learning_rate": 0.00026602776156191217, "loss": 0.0245, "step": 20950 }, { "epoch": 0.23, "learning_rate": 0.00026601154569630924, "loss": 0.0301, "step": 20960 }, { "epoch": 0.23, "learning_rate": 0.00026599532983070636, "loss": 0.0273, "step": 20970 }, { "epoch": 0.23, "learning_rate": 0.0002659791139651034, "loss": 0.0271, "step": 20980 }, { "epoch": 0.23, "learning_rate": 0.00026596289809950054, "loss": 0.027, "step": 20990 }, { "epoch": 0.23, "learning_rate": 0.0002659466822338976, "loss": 0.0248, "step": 21000 }, { "epoch": 0.23, "eval_cer": 0.9216103203928865, "eval_loss": 0.020444829016923904, "eval_runtime": 120.2567, "eval_samples_per_second": 16.631, "eval_steps_per_second": 4.158, "step": 21000 }, { "epoch": 0.23, "learning_rate": 0.00026593046636829473, "loss": 0.0277, "step": 21010 }, { "epoch": 0.23, "learning_rate": 0.0002659142505026918, "loss": 0.0304, "step": 21020 }, { "epoch": 0.23, "learning_rate": 0.0002658980346370889, "loss": 0.0277, "step": 21030 }, { "epoch": 0.23, "learning_rate": 0.000265881818771486, "loss": 0.0313, "step": 21040 }, { "epoch": 0.23, "learning_rate": 0.0002658656029058831, "loss": 0.0321, "step": 21050 }, { "epoch": 0.23, "learning_rate": 0.0002658493870402802, "loss": 0.0262, "step": 21060 }, { "epoch": 0.23, "learning_rate": 0.0002658331711746773, "loss": 0.0269, "step": 21070 }, { "epoch": 0.23, "learning_rate": 0.00026581695530907435, "loss": 0.0349, "step": 21080 }, { "epoch": 0.23, "learning_rate": 0.00026580073944347147, "loss": 0.0271, "step": 21090 }, { "epoch": 0.23, "learning_rate": 0.0002657845235778686, "loss": 0.0371, "step": 21100 }, { "epoch": 0.23, "learning_rate": 0.00026576830771226566, "loss": 0.0293, "step": 21110 }, { "epoch": 0.23, "learning_rate": 0.0002657520918466627, "loss": 0.0258, "step": 21120 }, { "epoch": 0.23, "learning_rate": 0.00026573587598105984, "loss": 0.0293, "step": 21130 }, { "epoch": 0.23, "learning_rate": 0.00026571966011545696, "loss": 0.0288, "step": 21140 }, { "epoch": 0.23, "learning_rate": 0.000265703444249854, "loss": 0.0282, "step": 21150 }, { "epoch": 0.23, "learning_rate": 0.0002656872283842511, "loss": 0.0323, "step": 21160 }, { "epoch": 0.23, "learning_rate": 0.0002656710125186482, "loss": 0.0274, "step": 21170 }, { "epoch": 0.23, "learning_rate": 0.00026565479665304533, "loss": 0.0253, "step": 21180 }, { "epoch": 0.23, "learning_rate": 0.0002656385807874424, "loss": 0.0245, "step": 21190 }, { "epoch": 0.23, "learning_rate": 0.0002656223649218395, "loss": 0.0291, "step": 21200 }, { "epoch": 0.23, "learning_rate": 0.0002656061490562366, "loss": 0.0237, "step": 21210 }, { "epoch": 0.23, "learning_rate": 0.0002655899331906337, "loss": 0.0235, "step": 21220 }, { "epoch": 0.23, "learning_rate": 0.0002655737173250308, "loss": 0.0274, "step": 21230 }, { "epoch": 0.23, "learning_rate": 0.0002655575014594279, "loss": 0.0245, "step": 21240 }, { "epoch": 0.23, "learning_rate": 0.00026554128559382495, "loss": 0.0273, "step": 21250 }, { "epoch": 0.23, "learning_rate": 0.0002655250697282221, "loss": 0.0253, "step": 21260 }, { "epoch": 0.23, "learning_rate": 0.0002655088538626192, "loss": 0.0266, "step": 21270 }, { "epoch": 0.23, "learning_rate": 0.00026549263799701626, "loss": 0.0442, "step": 21280 }, { "epoch": 0.23, "learning_rate": 0.0002654764221314133, "loss": 0.0368, "step": 21290 }, { "epoch": 0.23, "learning_rate": 0.00026546020626581044, "loss": 0.0298, "step": 21300 }, { "epoch": 0.23, "learning_rate": 0.00026544399040020756, "loss": 0.0337, "step": 21310 }, { "epoch": 0.23, "learning_rate": 0.00026542777453460463, "loss": 0.0249, "step": 21320 }, { "epoch": 0.23, "learning_rate": 0.0002654115586690017, "loss": 0.0333, "step": 21330 }, { "epoch": 0.23, "learning_rate": 0.0002653953428033988, "loss": 0.026, "step": 21340 }, { "epoch": 0.23, "learning_rate": 0.00026537912693779594, "loss": 0.0329, "step": 21350 }, { "epoch": 0.23, "learning_rate": 0.000265362911072193, "loss": 0.0336, "step": 21360 }, { "epoch": 0.23, "learning_rate": 0.0002653466952065901, "loss": 0.0282, "step": 21370 }, { "epoch": 0.23, "learning_rate": 0.0002653304793409872, "loss": 0.0274, "step": 21380 }, { "epoch": 0.23, "learning_rate": 0.0002653142634753843, "loss": 0.026, "step": 21390 }, { "epoch": 0.23, "learning_rate": 0.00026529804760978137, "loss": 0.0332, "step": 21400 }, { "epoch": 0.23, "learning_rate": 0.0002652818317441785, "loss": 0.027, "step": 21410 }, { "epoch": 0.23, "learning_rate": 0.00026526561587857556, "loss": 0.0242, "step": 21420 }, { "epoch": 0.23, "learning_rate": 0.0002652494000129727, "loss": 0.0276, "step": 21430 }, { "epoch": 0.23, "learning_rate": 0.00026523318414736974, "loss": 0.0244, "step": 21440 }, { "epoch": 0.23, "learning_rate": 0.00026521696828176686, "loss": 0.0316, "step": 21450 }, { "epoch": 0.23, "learning_rate": 0.00026520075241616393, "loss": 0.027, "step": 21460 }, { "epoch": 0.23, "learning_rate": 0.00026518453655056105, "loss": 0.0302, "step": 21470 }, { "epoch": 0.23, "learning_rate": 0.0002651683206849581, "loss": 0.0316, "step": 21480 }, { "epoch": 0.23, "learning_rate": 0.00026515210481935523, "loss": 0.0273, "step": 21490 }, { "epoch": 0.23, "learning_rate": 0.00026513588895375235, "loss": 0.0256, "step": 21500 }, { "epoch": 0.23, "learning_rate": 0.0002651196730881494, "loss": 0.0251, "step": 21510 }, { "epoch": 0.23, "learning_rate": 0.0002651034572225465, "loss": 0.0313, "step": 21520 }, { "epoch": 0.23, "learning_rate": 0.0002650872413569436, "loss": 0.03, "step": 21530 }, { "epoch": 0.23, "learning_rate": 0.0002650710254913407, "loss": 0.0249, "step": 21540 }, { "epoch": 0.23, "learning_rate": 0.0002650548096257378, "loss": 0.0254, "step": 21550 }, { "epoch": 0.23, "learning_rate": 0.00026503859376013486, "loss": 0.0225, "step": 21560 }, { "epoch": 0.23, "learning_rate": 0.000265022377894532, "loss": 0.031, "step": 21570 }, { "epoch": 0.23, "learning_rate": 0.0002650061620289291, "loss": 0.027, "step": 21580 }, { "epoch": 0.23, "learning_rate": 0.00026498994616332616, "loss": 0.0229, "step": 21590 }, { "epoch": 0.23, "learning_rate": 0.0002649737302977233, "loss": 0.0245, "step": 21600 }, { "epoch": 0.23, "learning_rate": 0.00026495751443212035, "loss": 0.0248, "step": 21610 }, { "epoch": 0.23, "learning_rate": 0.00026494129856651747, "loss": 0.0236, "step": 21620 }, { "epoch": 0.23, "learning_rate": 0.00026492508270091453, "loss": 0.0255, "step": 21630 }, { "epoch": 0.23, "learning_rate": 0.00026490886683531165, "loss": 0.029, "step": 21640 }, { "epoch": 0.23, "learning_rate": 0.0002648926509697087, "loss": 0.022, "step": 21650 }, { "epoch": 0.23, "learning_rate": 0.00026487643510410584, "loss": 0.0257, "step": 21660 }, { "epoch": 0.23, "learning_rate": 0.00026486021923850296, "loss": 0.0243, "step": 21670 }, { "epoch": 0.23, "learning_rate": 0.0002648440033729, "loss": 0.0272, "step": 21680 }, { "epoch": 0.23, "learning_rate": 0.0002648277875072971, "loss": 0.0279, "step": 21690 }, { "epoch": 0.23, "learning_rate": 0.0002648115716416942, "loss": 0.0259, "step": 21700 }, { "epoch": 0.23, "learning_rate": 0.00026479535577609133, "loss": 0.0236, "step": 21710 }, { "epoch": 0.23, "learning_rate": 0.0002647791399104884, "loss": 0.0248, "step": 21720 }, { "epoch": 0.23, "learning_rate": 0.00026476292404488546, "loss": 0.0269, "step": 21730 }, { "epoch": 0.24, "learning_rate": 0.0002647467081792826, "loss": 0.0268, "step": 21740 }, { "epoch": 0.24, "learning_rate": 0.0002647304923136797, "loss": 0.0235, "step": 21750 }, { "epoch": 0.24, "learning_rate": 0.00026471427644807677, "loss": 0.0316, "step": 21760 }, { "epoch": 0.24, "learning_rate": 0.0002646980605824739, "loss": 0.0272, "step": 21770 }, { "epoch": 0.24, "learning_rate": 0.00026468184471687095, "loss": 0.0294, "step": 21780 }, { "epoch": 0.24, "learning_rate": 0.00026466562885126807, "loss": 0.0239, "step": 21790 }, { "epoch": 0.24, "learning_rate": 0.0002646494129856652, "loss": 0.0286, "step": 21800 }, { "epoch": 0.24, "learning_rate": 0.00026463319712006226, "loss": 0.0334, "step": 21810 }, { "epoch": 0.24, "learning_rate": 0.0002646169812544593, "loss": 0.0255, "step": 21820 }, { "epoch": 0.24, "learning_rate": 0.00026460076538885644, "loss": 0.0279, "step": 21830 }, { "epoch": 0.24, "learning_rate": 0.00026458454952325356, "loss": 0.0309, "step": 21840 }, { "epoch": 0.24, "learning_rate": 0.0002645683336576506, "loss": 0.0284, "step": 21850 }, { "epoch": 0.24, "learning_rate": 0.0002645521177920477, "loss": 0.027, "step": 21860 }, { "epoch": 0.24, "learning_rate": 0.0002645359019264448, "loss": 0.0314, "step": 21870 }, { "epoch": 0.24, "learning_rate": 0.00026451968606084193, "loss": 0.0273, "step": 21880 }, { "epoch": 0.24, "learning_rate": 0.000264503470195239, "loss": 0.026, "step": 21890 }, { "epoch": 0.24, "learning_rate": 0.00026448725432963606, "loss": 0.0251, "step": 21900 }, { "epoch": 0.24, "learning_rate": 0.0002644710384640332, "loss": 0.0225, "step": 21910 }, { "epoch": 0.24, "learning_rate": 0.0002644548225984303, "loss": 0.0211, "step": 21920 }, { "epoch": 0.24, "learning_rate": 0.00026443860673282737, "loss": 0.027, "step": 21930 }, { "epoch": 0.24, "learning_rate": 0.0002644223908672245, "loss": 0.0245, "step": 21940 }, { "epoch": 0.24, "learning_rate": 0.00026440617500162155, "loss": 0.0269, "step": 21950 }, { "epoch": 0.24, "learning_rate": 0.0002643899591360187, "loss": 0.027, "step": 21960 }, { "epoch": 0.24, "learning_rate": 0.00026437374327041574, "loss": 0.0299, "step": 21970 }, { "epoch": 0.24, "learning_rate": 0.00026435752740481286, "loss": 0.026, "step": 21980 }, { "epoch": 0.24, "learning_rate": 0.0002643413115392099, "loss": 0.0299, "step": 21990 }, { "epoch": 0.24, "learning_rate": 0.00026432509567360705, "loss": 0.0258, "step": 22000 }, { "epoch": 0.24, "eval_cer": 0.9216268238490577, "eval_loss": 0.019485387951135635, "eval_runtime": 120.4283, "eval_samples_per_second": 16.607, "eval_steps_per_second": 4.152, "step": 22000 }, { "epoch": 0.24, "learning_rate": 0.0002643088798080041, "loss": 0.0258, "step": 22010 }, { "epoch": 0.24, "learning_rate": 0.00026429266394240123, "loss": 0.0266, "step": 22020 }, { "epoch": 0.24, "learning_rate": 0.0002642764480767983, "loss": 0.0296, "step": 22030 }, { "epoch": 0.24, "learning_rate": 0.0002642602322111954, "loss": 0.0248, "step": 22040 }, { "epoch": 0.24, "learning_rate": 0.0002642440163455925, "loss": 0.0365, "step": 22050 }, { "epoch": 0.24, "learning_rate": 0.0002642278004799896, "loss": 0.0311, "step": 22060 }, { "epoch": 0.24, "learning_rate": 0.0002642115846143867, "loss": 0.035, "step": 22070 }, { "epoch": 0.24, "learning_rate": 0.0002641953687487838, "loss": 0.0285, "step": 22080 }, { "epoch": 0.24, "learning_rate": 0.00026417915288318085, "loss": 0.028, "step": 22090 }, { "epoch": 0.24, "learning_rate": 0.00026416293701757797, "loss": 0.0277, "step": 22100 }, { "epoch": 0.24, "learning_rate": 0.0002641467211519751, "loss": 0.027, "step": 22110 }, { "epoch": 0.24, "learning_rate": 0.00026413050528637216, "loss": 0.028, "step": 22120 }, { "epoch": 0.24, "learning_rate": 0.0002641142894207692, "loss": 0.0245, "step": 22130 }, { "epoch": 0.24, "learning_rate": 0.00026409807355516634, "loss": 0.028, "step": 22140 }, { "epoch": 0.24, "learning_rate": 0.00026408185768956346, "loss": 0.0307, "step": 22150 }, { "epoch": 0.24, "learning_rate": 0.00026406564182396053, "loss": 0.0273, "step": 22160 }, { "epoch": 0.24, "learning_rate": 0.0002640494259583576, "loss": 0.0288, "step": 22170 }, { "epoch": 0.24, "learning_rate": 0.0002640332100927547, "loss": 0.0297, "step": 22180 }, { "epoch": 0.24, "learning_rate": 0.00026401699422715183, "loss": 0.0314, "step": 22190 }, { "epoch": 0.24, "learning_rate": 0.0002640007783615489, "loss": 0.0275, "step": 22200 }, { "epoch": 0.24, "learning_rate": 0.000263984562495946, "loss": 0.0258, "step": 22210 }, { "epoch": 0.24, "learning_rate": 0.0002639683466303431, "loss": 0.0315, "step": 22220 }, { "epoch": 0.24, "learning_rate": 0.0002639521307647402, "loss": 0.0347, "step": 22230 }, { "epoch": 0.24, "learning_rate": 0.0002639359148991373, "loss": 0.0277, "step": 22240 }, { "epoch": 0.24, "learning_rate": 0.0002639196990335344, "loss": 0.0286, "step": 22250 }, { "epoch": 0.24, "learning_rate": 0.00026390348316793146, "loss": 0.0313, "step": 22260 }, { "epoch": 0.24, "learning_rate": 0.0002638872673023286, "loss": 0.0325, "step": 22270 }, { "epoch": 0.24, "learning_rate": 0.0002638710514367257, "loss": 0.0272, "step": 22280 }, { "epoch": 0.24, "learning_rate": 0.00026385483557112276, "loss": 0.0327, "step": 22290 }, { "epoch": 0.24, "learning_rate": 0.00026383861970551983, "loss": 0.0262, "step": 22300 }, { "epoch": 0.24, "learning_rate": 0.00026382240383991695, "loss": 0.0326, "step": 22310 }, { "epoch": 0.24, "learning_rate": 0.00026380618797431407, "loss": 0.03, "step": 22320 }, { "epoch": 0.24, "learning_rate": 0.00026378997210871113, "loss": 0.0275, "step": 22330 }, { "epoch": 0.24, "learning_rate": 0.0002637737562431082, "loss": 0.0447, "step": 22340 }, { "epoch": 0.24, "learning_rate": 0.0002637575403775053, "loss": 0.0503, "step": 22350 }, { "epoch": 0.24, "learning_rate": 0.00026374132451190244, "loss": 0.0397, "step": 22360 }, { "epoch": 0.24, "learning_rate": 0.00026372510864629956, "loss": 0.0425, "step": 22370 }, { "epoch": 0.24, "learning_rate": 0.0002637088927806966, "loss": 0.0306, "step": 22380 }, { "epoch": 0.24, "learning_rate": 0.0002636926769150937, "loss": 0.0366, "step": 22390 }, { "epoch": 0.24, "learning_rate": 0.0002636764610494908, "loss": 0.0283, "step": 22400 }, { "epoch": 0.24, "learning_rate": 0.00026366024518388793, "loss": 0.0284, "step": 22410 }, { "epoch": 0.24, "learning_rate": 0.000263644029318285, "loss": 0.0279, "step": 22420 }, { "epoch": 0.24, "learning_rate": 0.00026362781345268206, "loss": 0.0276, "step": 22430 }, { "epoch": 0.24, "learning_rate": 0.0002636115975870792, "loss": 0.0264, "step": 22440 }, { "epoch": 0.24, "learning_rate": 0.0002635953817214763, "loss": 0.0272, "step": 22450 }, { "epoch": 0.24, "learning_rate": 0.00026357916585587337, "loss": 0.029, "step": 22460 }, { "epoch": 0.24, "learning_rate": 0.00026356294999027043, "loss": 0.0289, "step": 22470 }, { "epoch": 0.24, "learning_rate": 0.00026354673412466755, "loss": 0.0218, "step": 22480 }, { "epoch": 0.24, "learning_rate": 0.00026353051825906467, "loss": 0.0335, "step": 22490 }, { "epoch": 0.24, "learning_rate": 0.00026351430239346174, "loss": 0.0304, "step": 22500 }, { "epoch": 0.24, "learning_rate": 0.00026349808652785886, "loss": 0.0286, "step": 22510 }, { "epoch": 0.24, "learning_rate": 0.0002634818706622559, "loss": 0.0296, "step": 22520 }, { "epoch": 0.24, "learning_rate": 0.00026346565479665304, "loss": 0.0294, "step": 22530 }, { "epoch": 0.24, "learning_rate": 0.0002634494389310501, "loss": 0.0295, "step": 22540 }, { "epoch": 0.24, "learning_rate": 0.00026343322306544723, "loss": 0.0267, "step": 22550 }, { "epoch": 0.24, "learning_rate": 0.0002634170071998443, "loss": 0.028, "step": 22560 }, { "epoch": 0.24, "learning_rate": 0.0002634007913342414, "loss": 0.0287, "step": 22570 }, { "epoch": 0.24, "learning_rate": 0.0002633845754686385, "loss": 0.0312, "step": 22580 }, { "epoch": 0.24, "learning_rate": 0.0002633683596030356, "loss": 0.0336, "step": 22590 }, { "epoch": 0.24, "learning_rate": 0.00026335214373743266, "loss": 0.0285, "step": 22600 }, { "epoch": 0.24, "learning_rate": 0.0002633359278718298, "loss": 0.0269, "step": 22610 }, { "epoch": 0.24, "learning_rate": 0.00026331971200622685, "loss": 0.029, "step": 22620 }, { "epoch": 0.24, "learning_rate": 0.00026330349614062397, "loss": 0.0227, "step": 22630 }, { "epoch": 0.24, "learning_rate": 0.00026328728027502103, "loss": 0.0312, "step": 22640 }, { "epoch": 0.24, "learning_rate": 0.00026327106440941815, "loss": 0.0253, "step": 22650 }, { "epoch": 0.24, "learning_rate": 0.0002632548485438152, "loss": 0.0313, "step": 22660 }, { "epoch": 0.25, "learning_rate": 0.00026323863267821234, "loss": 0.0268, "step": 22670 }, { "epoch": 0.25, "learning_rate": 0.00026322241681260946, "loss": 0.0263, "step": 22680 }, { "epoch": 0.25, "learning_rate": 0.0002632062009470065, "loss": 0.0246, "step": 22690 }, { "epoch": 0.25, "learning_rate": 0.0002631899850814036, "loss": 0.0256, "step": 22700 }, { "epoch": 0.25, "learning_rate": 0.0002631737692158007, "loss": 0.025, "step": 22710 }, { "epoch": 0.25, "learning_rate": 0.00026315755335019783, "loss": 0.029, "step": 22720 }, { "epoch": 0.25, "learning_rate": 0.0002631413374845949, "loss": 0.0254, "step": 22730 }, { "epoch": 0.25, "learning_rate": 0.00026312512161899196, "loss": 0.0325, "step": 22740 }, { "epoch": 0.25, "learning_rate": 0.0002631089057533891, "loss": 0.0269, "step": 22750 }, { "epoch": 0.25, "learning_rate": 0.0002630926898877862, "loss": 0.0272, "step": 22760 }, { "epoch": 0.25, "learning_rate": 0.00026307647402218327, "loss": 0.0253, "step": 22770 }, { "epoch": 0.25, "learning_rate": 0.0002630602581565804, "loss": 0.0229, "step": 22780 }, { "epoch": 0.25, "learning_rate": 0.00026304404229097745, "loss": 0.0286, "step": 22790 }, { "epoch": 0.25, "learning_rate": 0.0002630278264253746, "loss": 0.0285, "step": 22800 }, { "epoch": 0.25, "learning_rate": 0.0002630116105597717, "loss": 0.0288, "step": 22810 }, { "epoch": 0.25, "learning_rate": 0.00026299539469416876, "loss": 0.0251, "step": 22820 }, { "epoch": 0.25, "learning_rate": 0.0002629791788285658, "loss": 0.0244, "step": 22830 }, { "epoch": 0.25, "learning_rate": 0.00026296296296296294, "loss": 0.025, "step": 22840 }, { "epoch": 0.25, "learning_rate": 0.00026294674709736006, "loss": 0.025, "step": 22850 }, { "epoch": 0.25, "learning_rate": 0.00026293053123175713, "loss": 0.0247, "step": 22860 }, { "epoch": 0.25, "learning_rate": 0.0002629143153661542, "loss": 0.0261, "step": 22870 }, { "epoch": 0.25, "learning_rate": 0.0002628980995005513, "loss": 0.0298, "step": 22880 }, { "epoch": 0.25, "learning_rate": 0.00026288188363494843, "loss": 0.0257, "step": 22890 }, { "epoch": 0.25, "learning_rate": 0.0002628656677693455, "loss": 0.0316, "step": 22900 }, { "epoch": 0.25, "learning_rate": 0.00026284945190374257, "loss": 0.0259, "step": 22910 }, { "epoch": 0.25, "learning_rate": 0.0002628332360381397, "loss": 0.0278, "step": 22920 }, { "epoch": 0.25, "learning_rate": 0.0002628170201725368, "loss": 0.0284, "step": 22930 }, { "epoch": 0.25, "learning_rate": 0.00026280080430693387, "loss": 0.0245, "step": 22940 }, { "epoch": 0.25, "learning_rate": 0.000262784588441331, "loss": 0.0262, "step": 22950 }, { "epoch": 0.25, "learning_rate": 0.00026276837257572806, "loss": 0.0276, "step": 22960 }, { "epoch": 0.25, "learning_rate": 0.0002627521567101252, "loss": 0.0271, "step": 22970 }, { "epoch": 0.25, "learning_rate": 0.00026273594084452224, "loss": 0.026, "step": 22980 }, { "epoch": 0.25, "learning_rate": 0.00026271972497891936, "loss": 0.0259, "step": 22990 }, { "epoch": 0.25, "learning_rate": 0.00026270350911331643, "loss": 0.0247, "step": 23000 }, { "epoch": 0.25, "eval_cer": 0.9215642844361985, "eval_loss": 0.018794536590576172, "eval_runtime": 119.88, "eval_samples_per_second": 16.683, "eval_steps_per_second": 4.171, "step": 23000 }, { "epoch": 0.25, "learning_rate": 0.00026268729324771355, "loss": 0.0282, "step": 23010 }, { "epoch": 0.25, "learning_rate": 0.00026267107738211067, "loss": 0.0299, "step": 23020 }, { "epoch": 0.25, "learning_rate": 0.00026265486151650773, "loss": 0.0276, "step": 23030 }, { "epoch": 0.25, "learning_rate": 0.0002626386456509048, "loss": 0.0255, "step": 23040 }, { "epoch": 0.25, "learning_rate": 0.0002626224297853019, "loss": 0.0257, "step": 23050 }, { "epoch": 0.25, "learning_rate": 0.00026260621391969904, "loss": 0.0253, "step": 23060 }, { "epoch": 0.25, "learning_rate": 0.0002625899980540961, "loss": 0.0266, "step": 23070 }, { "epoch": 0.25, "learning_rate": 0.0002625737821884932, "loss": 0.026, "step": 23080 }, { "epoch": 0.25, "learning_rate": 0.0002625575663228903, "loss": 0.0296, "step": 23090 }, { "epoch": 0.25, "learning_rate": 0.0002625413504572874, "loss": 0.0235, "step": 23100 }, { "epoch": 0.25, "learning_rate": 0.0002625251345916845, "loss": 0.027, "step": 23110 }, { "epoch": 0.25, "learning_rate": 0.0002625089187260816, "loss": 0.027, "step": 23120 }, { "epoch": 0.25, "learning_rate": 0.00026249270286047866, "loss": 0.0263, "step": 23130 }, { "epoch": 0.25, "learning_rate": 0.0002624764869948758, "loss": 0.0239, "step": 23140 }, { "epoch": 0.25, "learning_rate": 0.00026246027112927285, "loss": 0.02, "step": 23150 }, { "epoch": 0.25, "learning_rate": 0.00026244405526366997, "loss": 0.0264, "step": 23160 }, { "epoch": 0.25, "learning_rate": 0.00026242783939806703, "loss": 0.0259, "step": 23170 }, { "epoch": 0.25, "learning_rate": 0.00026241162353246415, "loss": 0.0247, "step": 23180 }, { "epoch": 0.25, "learning_rate": 0.0002623954076668612, "loss": 0.0236, "step": 23190 }, { "epoch": 0.25, "learning_rate": 0.00026237919180125834, "loss": 0.0233, "step": 23200 }, { "epoch": 0.25, "learning_rate": 0.0002623629759356554, "loss": 0.0241, "step": 23210 }, { "epoch": 0.25, "learning_rate": 0.0002623467600700525, "loss": 0.0303, "step": 23220 }, { "epoch": 0.25, "learning_rate": 0.0002623305442044496, "loss": 0.0266, "step": 23230 }, { "epoch": 0.25, "learning_rate": 0.0002623143283388467, "loss": 0.0269, "step": 23240 }, { "epoch": 0.25, "learning_rate": 0.00026229811247324383, "loss": 0.0215, "step": 23250 }, { "epoch": 0.25, "learning_rate": 0.0002622818966076409, "loss": 0.0261, "step": 23260 }, { "epoch": 0.25, "learning_rate": 0.00026226568074203796, "loss": 0.025, "step": 23270 }, { "epoch": 0.25, "learning_rate": 0.0002622494648764351, "loss": 0.0272, "step": 23280 }, { "epoch": 0.25, "learning_rate": 0.0002622332490108322, "loss": 0.0271, "step": 23290 }, { "epoch": 0.25, "learning_rate": 0.00026221703314522926, "loss": 0.0259, "step": 23300 }, { "epoch": 0.25, "learning_rate": 0.00026220081727962633, "loss": 0.0246, "step": 23310 }, { "epoch": 0.25, "learning_rate": 0.00026218460141402345, "loss": 0.0229, "step": 23320 }, { "epoch": 0.25, "learning_rate": 0.00026216838554842057, "loss": 0.0266, "step": 23330 }, { "epoch": 0.25, "learning_rate": 0.00026215216968281764, "loss": 0.0215, "step": 23340 }, { "epoch": 0.25, "learning_rate": 0.0002621359538172147, "loss": 0.0284, "step": 23350 }, { "epoch": 0.25, "learning_rate": 0.0002621197379516118, "loss": 0.023, "step": 23360 }, { "epoch": 0.25, "learning_rate": 0.00026210352208600894, "loss": 0.0237, "step": 23370 }, { "epoch": 0.25, "learning_rate": 0.00026208730622040606, "loss": 0.0293, "step": 23380 }, { "epoch": 0.25, "learning_rate": 0.0002620710903548031, "loss": 0.0329, "step": 23390 }, { "epoch": 0.25, "learning_rate": 0.0002620548744892002, "loss": 0.0271, "step": 23400 }, { "epoch": 0.25, "learning_rate": 0.0002620386586235973, "loss": 0.0272, "step": 23410 }, { "epoch": 0.25, "learning_rate": 0.00026202244275799443, "loss": 0.0236, "step": 23420 }, { "epoch": 0.25, "learning_rate": 0.0002620062268923915, "loss": 0.0231, "step": 23430 }, { "epoch": 0.25, "learning_rate": 0.00026199001102678856, "loss": 0.0228, "step": 23440 }, { "epoch": 0.25, "learning_rate": 0.0002619737951611857, "loss": 0.029, "step": 23450 }, { "epoch": 0.25, "learning_rate": 0.0002619575792955828, "loss": 0.0253, "step": 23460 }, { "epoch": 0.25, "learning_rate": 0.00026194136342997987, "loss": 0.027, "step": 23470 }, { "epoch": 0.25, "learning_rate": 0.00026192514756437693, "loss": 0.0263, "step": 23480 }, { "epoch": 0.25, "learning_rate": 0.00026190893169877405, "loss": 0.0268, "step": 23490 }, { "epoch": 0.25, "learning_rate": 0.0002618927158331712, "loss": 0.0408, "step": 23500 }, { "epoch": 0.25, "learning_rate": 0.00026187649996756824, "loss": 0.0305, "step": 23510 }, { "epoch": 0.25, "learning_rate": 0.00026186028410196536, "loss": 0.027, "step": 23520 }, { "epoch": 0.25, "learning_rate": 0.0002618440682363624, "loss": 0.0306, "step": 23530 }, { "epoch": 0.25, "learning_rate": 0.00026182785237075954, "loss": 0.0336, "step": 23540 }, { "epoch": 0.25, "learning_rate": 0.0002618116365051566, "loss": 0.0327, "step": 23550 }, { "epoch": 0.25, "learning_rate": 0.00026179542063955373, "loss": 0.028, "step": 23560 }, { "epoch": 0.25, "learning_rate": 0.0002617792047739508, "loss": 0.0262, "step": 23570 }, { "epoch": 0.25, "learning_rate": 0.0002617629889083479, "loss": 0.0314, "step": 23580 }, { "epoch": 0.26, "learning_rate": 0.000261746773042745, "loss": 0.0295, "step": 23590 }, { "epoch": 0.26, "learning_rate": 0.0002617305571771421, "loss": 0.0256, "step": 23600 }, { "epoch": 0.26, "learning_rate": 0.00026171434131153917, "loss": 0.0263, "step": 23610 }, { "epoch": 0.26, "learning_rate": 0.0002616981254459363, "loss": 0.0272, "step": 23620 }, { "epoch": 0.26, "learning_rate": 0.00026168190958033335, "loss": 0.0237, "step": 23630 }, { "epoch": 0.26, "learning_rate": 0.00026166569371473047, "loss": 0.0305, "step": 23640 }, { "epoch": 0.26, "learning_rate": 0.00026164947784912754, "loss": 0.0235, "step": 23650 }, { "epoch": 0.26, "learning_rate": 0.00026163326198352466, "loss": 0.0257, "step": 23660 }, { "epoch": 0.26, "learning_rate": 0.0002616170461179217, "loss": 0.0241, "step": 23670 }, { "epoch": 0.26, "learning_rate": 0.00026160083025231884, "loss": 0.0232, "step": 23680 }, { "epoch": 0.26, "learning_rate": 0.00026158461438671596, "loss": 0.0265, "step": 23690 }, { "epoch": 0.26, "learning_rate": 0.00026156839852111303, "loss": 0.0316, "step": 23700 }, { "epoch": 0.26, "learning_rate": 0.0002615521826555101, "loss": 0.0284, "step": 23710 }, { "epoch": 0.26, "learning_rate": 0.0002615359667899072, "loss": 0.025, "step": 23720 }, { "epoch": 0.26, "learning_rate": 0.00026151975092430433, "loss": 0.0272, "step": 23730 }, { "epoch": 0.26, "learning_rate": 0.0002615035350587014, "loss": 0.0241, "step": 23740 }, { "epoch": 0.26, "learning_rate": 0.0002614873191930985, "loss": 0.0252, "step": 23750 }, { "epoch": 0.26, "learning_rate": 0.0002614711033274956, "loss": 0.0222, "step": 23760 }, { "epoch": 0.26, "learning_rate": 0.0002614548874618927, "loss": 0.0227, "step": 23770 }, { "epoch": 0.26, "learning_rate": 0.00026143867159628977, "loss": 0.0225, "step": 23780 }, { "epoch": 0.26, "learning_rate": 0.0002614224557306869, "loss": 0.0233, "step": 23790 }, { "epoch": 0.26, "learning_rate": 0.00026140623986508396, "loss": 0.0216, "step": 23800 }, { "epoch": 0.26, "learning_rate": 0.0002613900239994811, "loss": 0.0234, "step": 23810 }, { "epoch": 0.26, "learning_rate": 0.0002613738081338782, "loss": 0.0233, "step": 23820 }, { "epoch": 0.26, "learning_rate": 0.00026135759226827526, "loss": 0.027, "step": 23830 }, { "epoch": 0.26, "learning_rate": 0.0002613413764026723, "loss": 0.0448, "step": 23840 }, { "epoch": 0.26, "learning_rate": 0.00026132516053706945, "loss": 0.0293, "step": 23850 }, { "epoch": 0.26, "learning_rate": 0.00026130894467146657, "loss": 0.0267, "step": 23860 }, { "epoch": 0.26, "learning_rate": 0.00026129272880586363, "loss": 0.0289, "step": 23870 }, { "epoch": 0.26, "learning_rate": 0.0002612765129402607, "loss": 0.0332, "step": 23880 }, { "epoch": 0.26, "learning_rate": 0.0002612602970746578, "loss": 0.0336, "step": 23890 }, { "epoch": 0.26, "learning_rate": 0.00026124408120905494, "loss": 0.0275, "step": 23900 }, { "epoch": 0.26, "learning_rate": 0.000261227865343452, "loss": 0.0261, "step": 23910 }, { "epoch": 0.26, "learning_rate": 0.00026121164947784907, "loss": 0.0259, "step": 23920 }, { "epoch": 0.26, "learning_rate": 0.0002611954336122462, "loss": 0.0236, "step": 23930 }, { "epoch": 0.26, "learning_rate": 0.0002611792177466433, "loss": 0.0238, "step": 23940 }, { "epoch": 0.26, "learning_rate": 0.00026116300188104043, "loss": 0.0291, "step": 23950 }, { "epoch": 0.26, "learning_rate": 0.0002611467860154375, "loss": 0.0276, "step": 23960 }, { "epoch": 0.26, "learning_rate": 0.00026113057014983456, "loss": 0.0274, "step": 23970 }, { "epoch": 0.26, "learning_rate": 0.0002611143542842317, "loss": 0.0258, "step": 23980 }, { "epoch": 0.26, "learning_rate": 0.0002610981384186288, "loss": 0.0264, "step": 23990 }, { "epoch": 0.26, "learning_rate": 0.00026108192255302586, "loss": 0.0285, "step": 24000 }, { "epoch": 0.26, "eval_cer": 0.9215486495829838, "eval_loss": 0.019064895808696747, "eval_runtime": 119.9759, "eval_samples_per_second": 16.67, "eval_steps_per_second": 4.168, "step": 24000 }, { "epoch": 0.26, "learning_rate": 0.00026106570668742293, "loss": 0.0229, "step": 24010 }, { "epoch": 0.26, "learning_rate": 0.00026104949082182005, "loss": 0.0273, "step": 24020 }, { "epoch": 0.26, "learning_rate": 0.00026103327495621717, "loss": 0.0242, "step": 24030 }, { "epoch": 0.26, "learning_rate": 0.00026101705909061424, "loss": 0.0285, "step": 24040 }, { "epoch": 0.26, "learning_rate": 0.0002610008432250113, "loss": 0.0284, "step": 24050 }, { "epoch": 0.26, "learning_rate": 0.0002609846273594084, "loss": 0.0254, "step": 24060 }, { "epoch": 0.26, "learning_rate": 0.00026096841149380554, "loss": 0.0238, "step": 24070 }, { "epoch": 0.26, "learning_rate": 0.0002609521956282026, "loss": 0.024, "step": 24080 }, { "epoch": 0.26, "learning_rate": 0.0002609359797625997, "loss": 0.0265, "step": 24090 }, { "epoch": 0.26, "learning_rate": 0.0002609197638969968, "loss": 0.0284, "step": 24100 }, { "epoch": 0.26, "learning_rate": 0.0002609035480313939, "loss": 0.0276, "step": 24110 }, { "epoch": 0.26, "learning_rate": 0.000260887332165791, "loss": 0.0275, "step": 24120 }, { "epoch": 0.26, "learning_rate": 0.0002608711163001881, "loss": 0.0306, "step": 24130 }, { "epoch": 0.26, "learning_rate": 0.00026085490043458516, "loss": 0.027, "step": 24140 }, { "epoch": 0.26, "learning_rate": 0.0002608386845689823, "loss": 0.0293, "step": 24150 }, { "epoch": 0.26, "learning_rate": 0.00026082246870337935, "loss": 0.0274, "step": 24160 }, { "epoch": 0.26, "learning_rate": 0.00026080625283777647, "loss": 0.0292, "step": 24170 }, { "epoch": 0.26, "learning_rate": 0.00026079003697217353, "loss": 0.0254, "step": 24180 }, { "epoch": 0.26, "learning_rate": 0.00026077382110657065, "loss": 0.0267, "step": 24190 }, { "epoch": 0.26, "learning_rate": 0.0002607576052409677, "loss": 0.0262, "step": 24200 }, { "epoch": 0.26, "learning_rate": 0.00026074138937536484, "loss": 0.0279, "step": 24210 }, { "epoch": 0.26, "learning_rate": 0.0002607251735097619, "loss": 0.032, "step": 24220 }, { "epoch": 0.26, "learning_rate": 0.000260708957644159, "loss": 0.0244, "step": 24230 }, { "epoch": 0.26, "learning_rate": 0.0002606927417785561, "loss": 0.0242, "step": 24240 }, { "epoch": 0.26, "learning_rate": 0.0002606765259129532, "loss": 0.0262, "step": 24250 }, { "epoch": 0.26, "learning_rate": 0.00026066031004735033, "loss": 0.0232, "step": 24260 }, { "epoch": 0.26, "learning_rate": 0.0002606440941817474, "loss": 0.0265, "step": 24270 }, { "epoch": 0.26, "learning_rate": 0.00026062787831614446, "loss": 0.026, "step": 24280 }, { "epoch": 0.26, "learning_rate": 0.0002606116624505416, "loss": 0.0259, "step": 24290 }, { "epoch": 0.26, "learning_rate": 0.0002605954465849387, "loss": 0.0264, "step": 24300 }, { "epoch": 0.26, "learning_rate": 0.00026057923071933577, "loss": 0.0246, "step": 24310 }, { "epoch": 0.26, "learning_rate": 0.00026056301485373283, "loss": 0.0276, "step": 24320 }, { "epoch": 0.26, "learning_rate": 0.00026054679898812995, "loss": 0.0271, "step": 24330 }, { "epoch": 0.26, "learning_rate": 0.00026053058312252707, "loss": 0.0256, "step": 24340 }, { "epoch": 0.26, "learning_rate": 0.00026051436725692414, "loss": 0.0259, "step": 24350 }, { "epoch": 0.26, "learning_rate": 0.0002604981513913212, "loss": 0.0223, "step": 24360 }, { "epoch": 0.26, "learning_rate": 0.0002604819355257183, "loss": 0.0231, "step": 24370 }, { "epoch": 0.26, "learning_rate": 0.00026046571966011544, "loss": 0.0276, "step": 24380 }, { "epoch": 0.26, "learning_rate": 0.00026044950379451256, "loss": 0.0235, "step": 24390 }, { "epoch": 0.26, "learning_rate": 0.00026043328792890963, "loss": 0.0226, "step": 24400 }, { "epoch": 0.26, "learning_rate": 0.0002604170720633067, "loss": 0.026, "step": 24410 }, { "epoch": 0.26, "learning_rate": 0.0002604008561977038, "loss": 0.0224, "step": 24420 }, { "epoch": 0.26, "learning_rate": 0.00026038464033210093, "loss": 0.0251, "step": 24430 }, { "epoch": 0.26, "learning_rate": 0.000260368424466498, "loss": 0.0275, "step": 24440 }, { "epoch": 0.26, "learning_rate": 0.00026035220860089507, "loss": 0.0268, "step": 24450 }, { "epoch": 0.26, "learning_rate": 0.0002603359927352922, "loss": 0.0218, "step": 24460 }, { "epoch": 0.26, "learning_rate": 0.0002603197768696893, "loss": 0.0218, "step": 24470 }, { "epoch": 0.26, "learning_rate": 0.00026030356100408637, "loss": 0.0259, "step": 24480 }, { "epoch": 0.26, "learning_rate": 0.00026028734513848344, "loss": 0.0258, "step": 24490 }, { "epoch": 0.26, "learning_rate": 0.00026027112927288056, "loss": 0.0277, "step": 24500 }, { "epoch": 0.26, "learning_rate": 0.0002602549134072777, "loss": 0.0236, "step": 24510 }, { "epoch": 0.27, "learning_rate": 0.00026023869754167474, "loss": 0.0223, "step": 24520 }, { "epoch": 0.27, "learning_rate": 0.00026022248167607186, "loss": 0.0299, "step": 24530 }, { "epoch": 0.27, "learning_rate": 0.00026020626581046893, "loss": 0.0246, "step": 24540 }, { "epoch": 0.27, "learning_rate": 0.00026019004994486605, "loss": 0.0231, "step": 24550 }, { "epoch": 0.27, "learning_rate": 0.00026017383407926317, "loss": 0.022, "step": 24560 }, { "epoch": 0.27, "learning_rate": 0.00026015761821366023, "loss": 0.0283, "step": 24570 }, { "epoch": 0.27, "learning_rate": 0.0002601414023480573, "loss": 0.0256, "step": 24580 }, { "epoch": 0.27, "learning_rate": 0.0002601251864824544, "loss": 0.0238, "step": 24590 }, { "epoch": 0.27, "learning_rate": 0.00026010897061685154, "loss": 0.0251, "step": 24600 }, { "epoch": 0.27, "learning_rate": 0.0002600927547512486, "loss": 0.0264, "step": 24610 }, { "epoch": 0.27, "learning_rate": 0.00026007653888564567, "loss": 0.03, "step": 24620 }, { "epoch": 0.27, "learning_rate": 0.0002600603230200428, "loss": 0.0245, "step": 24630 }, { "epoch": 0.27, "learning_rate": 0.0002600441071544399, "loss": 0.0227, "step": 24640 }, { "epoch": 0.27, "learning_rate": 0.000260027891288837, "loss": 0.0248, "step": 24650 }, { "epoch": 0.27, "learning_rate": 0.00026001167542323404, "loss": 0.03, "step": 24660 }, { "epoch": 0.27, "learning_rate": 0.00025999545955763116, "loss": 0.024, "step": 24670 }, { "epoch": 0.27, "learning_rate": 0.0002599792436920283, "loss": 0.0246, "step": 24680 }, { "epoch": 0.27, "learning_rate": 0.00025996302782642535, "loss": 0.0231, "step": 24690 }, { "epoch": 0.27, "learning_rate": 0.00025994681196082247, "loss": 0.0296, "step": 24700 }, { "epoch": 0.27, "learning_rate": 0.00025993059609521953, "loss": 0.0241, "step": 24710 }, { "epoch": 0.27, "learning_rate": 0.00025991438022961665, "loss": 0.0223, "step": 24720 }, { "epoch": 0.27, "learning_rate": 0.0002598981643640137, "loss": 0.0225, "step": 24730 }, { "epoch": 0.27, "learning_rate": 0.00025988194849841084, "loss": 0.0282, "step": 24740 }, { "epoch": 0.27, "learning_rate": 0.0002598657326328079, "loss": 0.0279, "step": 24750 }, { "epoch": 0.27, "learning_rate": 0.000259849516767205, "loss": 0.0249, "step": 24760 }, { "epoch": 0.27, "learning_rate": 0.0002598333009016021, "loss": 0.0252, "step": 24770 }, { "epoch": 0.27, "learning_rate": 0.0002598170850359992, "loss": 0.0307, "step": 24780 }, { "epoch": 0.27, "learning_rate": 0.00025980086917039627, "loss": 0.0254, "step": 24790 }, { "epoch": 0.27, "learning_rate": 0.0002597846533047934, "loss": 0.025, "step": 24800 }, { "epoch": 0.27, "learning_rate": 0.00025976843743919046, "loss": 0.0263, "step": 24810 }, { "epoch": 0.27, "learning_rate": 0.0002597522215735876, "loss": 0.0244, "step": 24820 }, { "epoch": 0.27, "learning_rate": 0.0002597360057079847, "loss": 0.0255, "step": 24830 }, { "epoch": 0.27, "learning_rate": 0.00025971978984238176, "loss": 0.0273, "step": 24840 }, { "epoch": 0.27, "learning_rate": 0.00025970357397677883, "loss": 0.0218, "step": 24850 }, { "epoch": 0.27, "learning_rate": 0.00025968735811117595, "loss": 0.0262, "step": 24860 }, { "epoch": 0.27, "learning_rate": 0.00025967114224557307, "loss": 0.0302, "step": 24870 }, { "epoch": 0.27, "learning_rate": 0.00025965492637997013, "loss": 0.0256, "step": 24880 }, { "epoch": 0.27, "learning_rate": 0.0002596387105143672, "loss": 0.0285, "step": 24890 }, { "epoch": 0.27, "learning_rate": 0.0002596224946487643, "loss": 0.0274, "step": 24900 }, { "epoch": 0.27, "learning_rate": 0.00025960627878316144, "loss": 0.027, "step": 24910 }, { "epoch": 0.27, "learning_rate": 0.0002595900629175585, "loss": 0.0244, "step": 24920 }, { "epoch": 0.27, "learning_rate": 0.00025957384705195557, "loss": 0.0329, "step": 24930 }, { "epoch": 0.27, "learning_rate": 0.0002595576311863527, "loss": 0.0289, "step": 24940 }, { "epoch": 0.27, "learning_rate": 0.0002595414153207498, "loss": 0.0278, "step": 24950 }, { "epoch": 0.27, "learning_rate": 0.00025952519945514693, "loss": 0.0292, "step": 24960 }, { "epoch": 0.27, "learning_rate": 0.000259508983589544, "loss": 0.028, "step": 24970 }, { "epoch": 0.27, "learning_rate": 0.00025949276772394106, "loss": 0.0306, "step": 24980 }, { "epoch": 0.27, "learning_rate": 0.0002594765518583382, "loss": 0.0266, "step": 24990 }, { "epoch": 0.27, "learning_rate": 0.0002594603359927353, "loss": 0.031, "step": 25000 }, { "epoch": 0.27, "eval_cer": 0.9215703646568931, "eval_loss": 0.019244205206632614, "eval_runtime": 120.3576, "eval_samples_per_second": 16.617, "eval_steps_per_second": 4.154, "step": 25000 }, { "epoch": 0.27, "learning_rate": 0.00025944412012713237, "loss": 0.0276, "step": 25010 }, { "epoch": 0.27, "learning_rate": 0.00025942790426152943, "loss": 0.0269, "step": 25020 }, { "epoch": 0.27, "learning_rate": 0.00025941168839592655, "loss": 0.0284, "step": 25030 }, { "epoch": 0.27, "learning_rate": 0.00025939547253032367, "loss": 0.0237, "step": 25040 }, { "epoch": 0.27, "learning_rate": 0.00025937925666472074, "loss": 0.0266, "step": 25050 }, { "epoch": 0.27, "learning_rate": 0.0002593630407991178, "loss": 0.0272, "step": 25060 }, { "epoch": 0.27, "learning_rate": 0.0002593468249335149, "loss": 0.0241, "step": 25070 }, { "epoch": 0.27, "learning_rate": 0.00025933060906791204, "loss": 0.0298, "step": 25080 }, { "epoch": 0.27, "learning_rate": 0.0002593143932023091, "loss": 0.0354, "step": 25090 }, { "epoch": 0.27, "learning_rate": 0.00025929817733670623, "loss": 0.0274, "step": 25100 }, { "epoch": 0.27, "learning_rate": 0.0002592819614711033, "loss": 0.0265, "step": 25110 }, { "epoch": 0.27, "learning_rate": 0.0002592657456055004, "loss": 0.033, "step": 25120 }, { "epoch": 0.27, "learning_rate": 0.0002592495297398975, "loss": 0.026, "step": 25130 }, { "epoch": 0.27, "learning_rate": 0.0002592333138742946, "loss": 0.0254, "step": 25140 }, { "epoch": 0.27, "learning_rate": 0.00025921709800869167, "loss": 0.0255, "step": 25150 }, { "epoch": 0.27, "learning_rate": 0.0002592008821430888, "loss": 0.0277, "step": 25160 }, { "epoch": 0.27, "learning_rate": 0.00025918466627748585, "loss": 0.0233, "step": 25170 }, { "epoch": 0.27, "learning_rate": 0.00025916845041188297, "loss": 0.0255, "step": 25180 }, { "epoch": 0.27, "learning_rate": 0.00025915223454628004, "loss": 0.0275, "step": 25190 }, { "epoch": 0.27, "learning_rate": 0.00025913601868067716, "loss": 0.025, "step": 25200 }, { "epoch": 0.27, "learning_rate": 0.0002591198028150743, "loss": 0.0225, "step": 25210 }, { "epoch": 0.27, "learning_rate": 0.00025910358694947134, "loss": 0.0277, "step": 25220 }, { "epoch": 0.27, "learning_rate": 0.0002590873710838684, "loss": 0.0254, "step": 25230 }, { "epoch": 0.27, "learning_rate": 0.00025907115521826553, "loss": 0.0253, "step": 25240 }, { "epoch": 0.27, "learning_rate": 0.00025905493935266265, "loss": 0.0242, "step": 25250 }, { "epoch": 0.27, "learning_rate": 0.0002590387234870597, "loss": 0.0235, "step": 25260 }, { "epoch": 0.27, "learning_rate": 0.00025902250762145683, "loss": 0.0245, "step": 25270 }, { "epoch": 0.27, "learning_rate": 0.0002590062917558539, "loss": 0.0262, "step": 25280 }, { "epoch": 0.27, "learning_rate": 0.000258990075890251, "loss": 0.025, "step": 25290 }, { "epoch": 0.27, "learning_rate": 0.0002589738600246481, "loss": 0.0261, "step": 25300 }, { "epoch": 0.27, "learning_rate": 0.0002589576441590452, "loss": 0.0253, "step": 25310 }, { "epoch": 0.27, "learning_rate": 0.00025894142829344227, "loss": 0.0247, "step": 25320 }, { "epoch": 0.27, "learning_rate": 0.0002589252124278394, "loss": 0.0288, "step": 25330 }, { "epoch": 0.27, "learning_rate": 0.00025890899656223646, "loss": 0.0268, "step": 25340 }, { "epoch": 0.27, "learning_rate": 0.0002588927806966336, "loss": 0.026, "step": 25350 }, { "epoch": 0.27, "learning_rate": 0.00025887656483103064, "loss": 0.0252, "step": 25360 }, { "epoch": 0.27, "learning_rate": 0.00025886034896542776, "loss": 0.0243, "step": 25370 }, { "epoch": 0.27, "learning_rate": 0.0002588441330998248, "loss": 0.0242, "step": 25380 }, { "epoch": 0.27, "learning_rate": 0.00025882791723422195, "loss": 0.0268, "step": 25390 }, { "epoch": 0.27, "learning_rate": 0.00025881170136861907, "loss": 0.0222, "step": 25400 }, { "epoch": 0.27, "learning_rate": 0.00025879548550301613, "loss": 0.0293, "step": 25410 }, { "epoch": 0.27, "learning_rate": 0.0002587792696374132, "loss": 0.0239, "step": 25420 }, { "epoch": 0.27, "learning_rate": 0.0002587630537718103, "loss": 0.0257, "step": 25430 }, { "epoch": 0.28, "learning_rate": 0.00025874683790620744, "loss": 0.0278, "step": 25440 }, { "epoch": 0.28, "learning_rate": 0.0002587306220406045, "loss": 0.0228, "step": 25450 }, { "epoch": 0.28, "learning_rate": 0.00025871440617500157, "loss": 0.0241, "step": 25460 }, { "epoch": 0.28, "learning_rate": 0.0002586981903093987, "loss": 0.0282, "step": 25470 }, { "epoch": 0.28, "learning_rate": 0.0002586819744437958, "loss": 0.0208, "step": 25480 }, { "epoch": 0.28, "learning_rate": 0.0002586657585781929, "loss": 0.0233, "step": 25490 }, { "epoch": 0.28, "learning_rate": 0.00025864954271258994, "loss": 0.0212, "step": 25500 }, { "epoch": 0.28, "learning_rate": 0.00025863332684698706, "loss": 0.024, "step": 25510 }, { "epoch": 0.28, "learning_rate": 0.0002586171109813842, "loss": 0.0255, "step": 25520 }, { "epoch": 0.28, "learning_rate": 0.00025860089511578124, "loss": 0.0315, "step": 25530 }, { "epoch": 0.28, "learning_rate": 0.00025858467925017836, "loss": 0.0256, "step": 25540 }, { "epoch": 0.28, "learning_rate": 0.00025856846338457543, "loss": 0.0263, "step": 25550 }, { "epoch": 0.28, "learning_rate": 0.00025855224751897255, "loss": 0.0252, "step": 25560 }, { "epoch": 0.28, "learning_rate": 0.00025853603165336967, "loss": 0.0228, "step": 25570 }, { "epoch": 0.28, "learning_rate": 0.00025851981578776674, "loss": 0.0229, "step": 25580 }, { "epoch": 0.28, "learning_rate": 0.0002585035999221638, "loss": 0.0274, "step": 25590 }, { "epoch": 0.28, "learning_rate": 0.0002584873840565609, "loss": 0.0268, "step": 25600 }, { "epoch": 0.28, "learning_rate": 0.00025847116819095804, "loss": 0.0292, "step": 25610 }, { "epoch": 0.28, "learning_rate": 0.0002584549523253551, "loss": 0.0276, "step": 25620 }, { "epoch": 0.28, "learning_rate": 0.00025843873645975217, "loss": 0.0248, "step": 25630 }, { "epoch": 0.28, "learning_rate": 0.0002584225205941493, "loss": 0.0257, "step": 25640 }, { "epoch": 0.28, "learning_rate": 0.0002584063047285464, "loss": 0.0283, "step": 25650 }, { "epoch": 0.28, "learning_rate": 0.0002583900888629435, "loss": 0.0327, "step": 25660 }, { "epoch": 0.28, "learning_rate": 0.00025837387299734054, "loss": 0.046, "step": 25670 }, { "epoch": 0.28, "learning_rate": 0.00025835765713173766, "loss": 0.0337, "step": 25680 }, { "epoch": 0.28, "learning_rate": 0.0002583414412661348, "loss": 0.0251, "step": 25690 }, { "epoch": 0.28, "learning_rate": 0.00025832522540053185, "loss": 0.0266, "step": 25700 }, { "epoch": 0.28, "learning_rate": 0.00025830900953492897, "loss": 0.0259, "step": 25710 }, { "epoch": 0.28, "learning_rate": 0.00025829279366932603, "loss": 0.0251, "step": 25720 }, { "epoch": 0.28, "learning_rate": 0.00025827657780372315, "loss": 0.0282, "step": 25730 }, { "epoch": 0.28, "learning_rate": 0.0002582603619381202, "loss": 0.025, "step": 25740 }, { "epoch": 0.28, "learning_rate": 0.00025824414607251734, "loss": 0.0273, "step": 25750 }, { "epoch": 0.28, "learning_rate": 0.0002582279302069144, "loss": 0.0252, "step": 25760 }, { "epoch": 0.28, "learning_rate": 0.0002582117143413115, "loss": 0.0192, "step": 25770 }, { "epoch": 0.28, "learning_rate": 0.0002581954984757086, "loss": 0.026, "step": 25780 }, { "epoch": 0.28, "learning_rate": 0.0002581792826101057, "loss": 0.0234, "step": 25790 }, { "epoch": 0.28, "learning_rate": 0.0002581630667445028, "loss": 0.0299, "step": 25800 }, { "epoch": 0.28, "learning_rate": 0.0002581468508788999, "loss": 0.0289, "step": 25810 }, { "epoch": 0.28, "learning_rate": 0.00025813063501329696, "loss": 0.0294, "step": 25820 }, { "epoch": 0.28, "learning_rate": 0.0002581144191476941, "loss": 0.029, "step": 25830 }, { "epoch": 0.28, "learning_rate": 0.0002580982032820912, "loss": 0.0276, "step": 25840 }, { "epoch": 0.28, "learning_rate": 0.00025808198741648827, "loss": 0.0252, "step": 25850 }, { "epoch": 0.28, "learning_rate": 0.00025806577155088533, "loss": 0.0265, "step": 25860 }, { "epoch": 0.28, "learning_rate": 0.00025804955568528245, "loss": 0.0256, "step": 25870 }, { "epoch": 0.28, "learning_rate": 0.00025803333981967957, "loss": 0.0313, "step": 25880 }, { "epoch": 0.28, "learning_rate": 0.00025801712395407664, "loss": 0.0267, "step": 25890 }, { "epoch": 0.28, "learning_rate": 0.00025800090808847376, "loss": 0.0272, "step": 25900 }, { "epoch": 0.28, "learning_rate": 0.0002579846922228708, "loss": 0.0244, "step": 25910 }, { "epoch": 0.28, "learning_rate": 0.00025796847635726794, "loss": 0.0233, "step": 25920 }, { "epoch": 0.28, "learning_rate": 0.000257952260491665, "loss": 0.0215, "step": 25930 }, { "epoch": 0.28, "learning_rate": 0.00025793604462606213, "loss": 0.0247, "step": 25940 }, { "epoch": 0.28, "learning_rate": 0.0002579198287604592, "loss": 0.0214, "step": 25950 }, { "epoch": 0.28, "learning_rate": 0.0002579036128948563, "loss": 0.0236, "step": 25960 }, { "epoch": 0.28, "learning_rate": 0.00025788739702925343, "loss": 0.0249, "step": 25970 }, { "epoch": 0.28, "learning_rate": 0.0002578711811636505, "loss": 0.0248, "step": 25980 }, { "epoch": 0.28, "learning_rate": 0.00025785496529804756, "loss": 0.0227, "step": 25990 }, { "epoch": 0.28, "learning_rate": 0.0002578387494324447, "loss": 0.0267, "step": 26000 }, { "epoch": 0.28, "eval_cer": 0.9215616786273294, "eval_loss": 0.018755970522761345, "eval_runtime": 120.1496, "eval_samples_per_second": 16.646, "eval_steps_per_second": 4.161, "step": 26000 }, { "epoch": 0.28, "learning_rate": 0.0002578225335668418, "loss": 0.0251, "step": 26010 }, { "epoch": 0.28, "learning_rate": 0.00025780631770123887, "loss": 0.0249, "step": 26020 }, { "epoch": 0.28, "learning_rate": 0.00025779010183563594, "loss": 0.0247, "step": 26030 }, { "epoch": 0.28, "learning_rate": 0.00025777388597003306, "loss": 0.0351, "step": 26040 }, { "epoch": 0.28, "learning_rate": 0.0002577576701044302, "loss": 0.0259, "step": 26050 }, { "epoch": 0.28, "learning_rate": 0.00025774145423882724, "loss": 0.0276, "step": 26060 }, { "epoch": 0.28, "learning_rate": 0.0002577252383732243, "loss": 0.0274, "step": 26070 }, { "epoch": 0.28, "learning_rate": 0.0002577090225076214, "loss": 0.0235, "step": 26080 }, { "epoch": 0.28, "learning_rate": 0.00025769280664201855, "loss": 0.0275, "step": 26090 }, { "epoch": 0.28, "learning_rate": 0.0002576765907764156, "loss": 0.0268, "step": 26100 }, { "epoch": 0.28, "learning_rate": 0.00025766037491081273, "loss": 0.0259, "step": 26110 }, { "epoch": 0.28, "learning_rate": 0.0002576441590452098, "loss": 0.0272, "step": 26120 }, { "epoch": 0.28, "learning_rate": 0.0002576279431796069, "loss": 0.0223, "step": 26130 }, { "epoch": 0.28, "learning_rate": 0.00025761172731400404, "loss": 0.0254, "step": 26140 }, { "epoch": 0.28, "learning_rate": 0.0002575955114484011, "loss": 0.0241, "step": 26150 }, { "epoch": 0.28, "learning_rate": 0.00025757929558279817, "loss": 0.0237, "step": 26160 }, { "epoch": 0.28, "learning_rate": 0.0002575630797171953, "loss": 0.025, "step": 26170 }, { "epoch": 0.28, "learning_rate": 0.0002575468638515924, "loss": 0.0225, "step": 26180 }, { "epoch": 0.28, "learning_rate": 0.0002575306479859895, "loss": 0.0248, "step": 26190 }, { "epoch": 0.28, "learning_rate": 0.00025751443212038654, "loss": 0.0234, "step": 26200 }, { "epoch": 0.28, "learning_rate": 0.00025749821625478366, "loss": 0.0257, "step": 26210 }, { "epoch": 0.28, "learning_rate": 0.0002574820003891808, "loss": 0.0234, "step": 26220 }, { "epoch": 0.28, "learning_rate": 0.00025746578452357784, "loss": 0.027, "step": 26230 }, { "epoch": 0.28, "learning_rate": 0.0002574495686579749, "loss": 0.0261, "step": 26240 }, { "epoch": 0.28, "learning_rate": 0.00025743335279237203, "loss": 0.0206, "step": 26250 }, { "epoch": 0.28, "learning_rate": 0.00025741713692676915, "loss": 0.0221, "step": 26260 }, { "epoch": 0.28, "learning_rate": 0.0002574009210611662, "loss": 0.0269, "step": 26270 }, { "epoch": 0.28, "learning_rate": 0.00025738470519556334, "loss": 0.0274, "step": 26280 }, { "epoch": 0.28, "learning_rate": 0.0002573684893299604, "loss": 0.0232, "step": 26290 }, { "epoch": 0.28, "learning_rate": 0.0002573522734643575, "loss": 0.0258, "step": 26300 }, { "epoch": 0.28, "learning_rate": 0.0002573360575987546, "loss": 0.0267, "step": 26310 }, { "epoch": 0.28, "learning_rate": 0.0002573198417331517, "loss": 0.0257, "step": 26320 }, { "epoch": 0.28, "learning_rate": 0.00025730362586754877, "loss": 0.0275, "step": 26330 }, { "epoch": 0.28, "learning_rate": 0.0002572874100019459, "loss": 0.0222, "step": 26340 }, { "epoch": 0.28, "learning_rate": 0.00025727119413634296, "loss": 0.0248, "step": 26350 }, { "epoch": 0.28, "learning_rate": 0.0002572549782707401, "loss": 0.0227, "step": 26360 }, { "epoch": 0.29, "learning_rate": 0.00025723876240513714, "loss": 0.0276, "step": 26370 }, { "epoch": 0.29, "learning_rate": 0.00025722254653953426, "loss": 0.0216, "step": 26380 }, { "epoch": 0.29, "learning_rate": 0.00025720633067393133, "loss": 0.0216, "step": 26390 }, { "epoch": 0.29, "learning_rate": 0.00025719011480832845, "loss": 0.0253, "step": 26400 }, { "epoch": 0.29, "learning_rate": 0.00025717389894272557, "loss": 0.0278, "step": 26410 }, { "epoch": 0.29, "learning_rate": 0.00025715768307712263, "loss": 0.0285, "step": 26420 }, { "epoch": 0.29, "learning_rate": 0.0002571414672115197, "loss": 0.023, "step": 26430 }, { "epoch": 0.29, "learning_rate": 0.0002571252513459168, "loss": 0.0252, "step": 26440 }, { "epoch": 0.29, "learning_rate": 0.00025710903548031394, "loss": 0.0229, "step": 26450 }, { "epoch": 0.29, "learning_rate": 0.000257092819614711, "loss": 0.023, "step": 26460 }, { "epoch": 0.29, "learning_rate": 0.00025707660374910807, "loss": 0.0252, "step": 26470 }, { "epoch": 0.29, "learning_rate": 0.0002570603878835052, "loss": 0.0227, "step": 26480 }, { "epoch": 0.29, "learning_rate": 0.0002570441720179023, "loss": 0.0236, "step": 26490 }, { "epoch": 0.29, "learning_rate": 0.0002570279561522994, "loss": 0.0263, "step": 26500 }, { "epoch": 0.29, "learning_rate": 0.00025701174028669644, "loss": 0.0218, "step": 26510 }, { "epoch": 0.29, "learning_rate": 0.00025699552442109356, "loss": 0.0238, "step": 26520 }, { "epoch": 0.29, "learning_rate": 0.0002569793085554907, "loss": 0.0318, "step": 26530 }, { "epoch": 0.29, "learning_rate": 0.00025696309268988775, "loss": 0.0265, "step": 26540 }, { "epoch": 0.29, "learning_rate": 0.00025694687682428487, "loss": 0.0272, "step": 26550 }, { "epoch": 0.29, "learning_rate": 0.00025693066095868193, "loss": 0.03, "step": 26560 }, { "epoch": 0.29, "learning_rate": 0.00025691444509307905, "loss": 0.0232, "step": 26570 }, { "epoch": 0.29, "learning_rate": 0.00025689822922747617, "loss": 0.0275, "step": 26580 }, { "epoch": 0.29, "learning_rate": 0.00025688201336187324, "loss": 0.022, "step": 26590 }, { "epoch": 0.29, "learning_rate": 0.0002568657974962703, "loss": 0.0226, "step": 26600 }, { "epoch": 0.29, "learning_rate": 0.0002568495816306674, "loss": 0.022, "step": 26610 }, { "epoch": 0.29, "learning_rate": 0.00025683336576506454, "loss": 0.0205, "step": 26620 }, { "epoch": 0.29, "learning_rate": 0.0002568171498994616, "loss": 0.0238, "step": 26630 }, { "epoch": 0.29, "learning_rate": 0.0002568009340338587, "loss": 0.0247, "step": 26640 }, { "epoch": 0.29, "learning_rate": 0.0002567847181682558, "loss": 0.0244, "step": 26650 }, { "epoch": 0.29, "learning_rate": 0.0002567685023026529, "loss": 0.0237, "step": 26660 }, { "epoch": 0.29, "learning_rate": 0.00025675228643705, "loss": 0.0238, "step": 26670 }, { "epoch": 0.29, "learning_rate": 0.00025673607057144705, "loss": 0.0202, "step": 26680 }, { "epoch": 0.29, "learning_rate": 0.00025671985470584417, "loss": 0.021, "step": 26690 }, { "epoch": 0.29, "learning_rate": 0.0002567036388402413, "loss": 0.0244, "step": 26700 }, { "epoch": 0.29, "learning_rate": 0.0002566874229746384, "loss": 0.0269, "step": 26710 }, { "epoch": 0.29, "learning_rate": 0.00025667120710903547, "loss": 0.0263, "step": 26720 }, { "epoch": 0.29, "learning_rate": 0.00025665499124343254, "loss": 0.0287, "step": 26730 }, { "epoch": 0.29, "learning_rate": 0.00025663877537782966, "loss": 0.0214, "step": 26740 }, { "epoch": 0.29, "learning_rate": 0.0002566225595122268, "loss": 0.0286, "step": 26750 }, { "epoch": 0.29, "learning_rate": 0.00025660634364662384, "loss": 0.0279, "step": 26760 }, { "epoch": 0.29, "learning_rate": 0.0002565901277810209, "loss": 0.0235, "step": 26770 }, { "epoch": 0.29, "learning_rate": 0.000256573911915418, "loss": 0.0215, "step": 26780 }, { "epoch": 0.29, "learning_rate": 0.00025655769604981515, "loss": 0.0342, "step": 26790 }, { "epoch": 0.29, "learning_rate": 0.0002565414801842122, "loss": 0.0287, "step": 26800 }, { "epoch": 0.29, "learning_rate": 0.0002565252643186093, "loss": 0.0253, "step": 26810 }, { "epoch": 0.29, "learning_rate": 0.0002565090484530064, "loss": 0.0221, "step": 26820 }, { "epoch": 0.29, "learning_rate": 0.0002564928325874035, "loss": 0.0242, "step": 26830 }, { "epoch": 0.29, "learning_rate": 0.0002564766167218006, "loss": 0.0248, "step": 26840 }, { "epoch": 0.29, "learning_rate": 0.0002564604008561977, "loss": 0.0224, "step": 26850 }, { "epoch": 0.29, "learning_rate": 0.00025644418499059477, "loss": 0.0213, "step": 26860 }, { "epoch": 0.29, "learning_rate": 0.0002564279691249919, "loss": 0.0215, "step": 26870 }, { "epoch": 0.29, "learning_rate": 0.00025641175325938895, "loss": 0.0267, "step": 26880 }, { "epoch": 0.29, "learning_rate": 0.0002563955373937861, "loss": 0.0316, "step": 26890 }, { "epoch": 0.29, "learning_rate": 0.00025637932152818314, "loss": 0.0238, "step": 26900 }, { "epoch": 0.29, "learning_rate": 0.00025636310566258026, "loss": 0.0269, "step": 26910 }, { "epoch": 0.29, "learning_rate": 0.0002563468897969773, "loss": 0.0244, "step": 26920 }, { "epoch": 0.29, "learning_rate": 0.00025633067393137445, "loss": 0.0217, "step": 26930 }, { "epoch": 0.29, "learning_rate": 0.0002563144580657715, "loss": 0.0233, "step": 26940 }, { "epoch": 0.29, "learning_rate": 0.00025629824220016863, "loss": 0.0256, "step": 26950 }, { "epoch": 0.29, "learning_rate": 0.0002562820263345657, "loss": 0.0215, "step": 26960 }, { "epoch": 0.29, "learning_rate": 0.0002562658104689628, "loss": 0.0255, "step": 26970 }, { "epoch": 0.29, "learning_rate": 0.00025624959460335994, "loss": 0.0216, "step": 26980 }, { "epoch": 0.29, "learning_rate": 0.000256233378737757, "loss": 0.0233, "step": 26990 }, { "epoch": 0.29, "learning_rate": 0.00025621716287215407, "loss": 0.0245, "step": 27000 }, { "epoch": 0.29, "eval_cer": 0.9215590728184603, "eval_loss": 0.017664359882473946, "eval_runtime": 120.4378, "eval_samples_per_second": 16.606, "eval_steps_per_second": 4.152, "step": 27000 }, { "epoch": 0.29, "learning_rate": 0.0002562009470065512, "loss": 0.0323, "step": 27010 }, { "epoch": 0.29, "learning_rate": 0.0002561847311409483, "loss": 0.0263, "step": 27020 }, { "epoch": 0.29, "learning_rate": 0.00025616851527534537, "loss": 0.0228, "step": 27030 }, { "epoch": 0.29, "learning_rate": 0.00025615229940974244, "loss": 0.0333, "step": 27040 }, { "epoch": 0.29, "learning_rate": 0.00025613608354413956, "loss": 0.0262, "step": 27050 }, { "epoch": 0.29, "learning_rate": 0.0002561198676785367, "loss": 0.0223, "step": 27060 }, { "epoch": 0.29, "learning_rate": 0.00025610365181293374, "loss": 0.0242, "step": 27070 }, { "epoch": 0.29, "learning_rate": 0.0002560874359473308, "loss": 0.0293, "step": 27080 }, { "epoch": 0.29, "learning_rate": 0.00025607122008172793, "loss": 0.0271, "step": 27090 }, { "epoch": 0.29, "learning_rate": 0.00025605500421612505, "loss": 0.0202, "step": 27100 }, { "epoch": 0.29, "learning_rate": 0.0002560387883505221, "loss": 0.0247, "step": 27110 }, { "epoch": 0.29, "learning_rate": 0.00025602257248491923, "loss": 0.0321, "step": 27120 }, { "epoch": 0.29, "learning_rate": 0.0002560063566193163, "loss": 0.0203, "step": 27130 }, { "epoch": 0.29, "learning_rate": 0.0002559901407537134, "loss": 0.0247, "step": 27140 }, { "epoch": 0.29, "learning_rate": 0.00025597392488811054, "loss": 0.0242, "step": 27150 }, { "epoch": 0.29, "learning_rate": 0.0002559577090225076, "loss": 0.027, "step": 27160 }, { "epoch": 0.29, "learning_rate": 0.00025594149315690467, "loss": 0.0283, "step": 27170 }, { "epoch": 0.29, "learning_rate": 0.0002559252772913018, "loss": 0.0251, "step": 27180 }, { "epoch": 0.29, "learning_rate": 0.0002559090614256989, "loss": 0.0242, "step": 27190 }, { "epoch": 0.29, "learning_rate": 0.000255892845560096, "loss": 0.0212, "step": 27200 }, { "epoch": 0.29, "learning_rate": 0.00025587662969449304, "loss": 0.0241, "step": 27210 }, { "epoch": 0.29, "learning_rate": 0.00025586041382889016, "loss": 0.025, "step": 27220 }, { "epoch": 0.29, "learning_rate": 0.0002558441979632873, "loss": 0.0254, "step": 27230 }, { "epoch": 0.29, "learning_rate": 0.00025582798209768435, "loss": 0.0288, "step": 27240 }, { "epoch": 0.29, "learning_rate": 0.0002558117662320814, "loss": 0.0271, "step": 27250 }, { "epoch": 0.29, "learning_rate": 0.00025579555036647853, "loss": 0.0226, "step": 27260 }, { "epoch": 0.29, "learning_rate": 0.00025577933450087565, "loss": 0.026, "step": 27270 }, { "epoch": 0.29, "learning_rate": 0.0002557631186352727, "loss": 0.0226, "step": 27280 }, { "epoch": 0.3, "learning_rate": 0.00025574690276966984, "loss": 0.0251, "step": 27290 }, { "epoch": 0.3, "learning_rate": 0.0002557306869040669, "loss": 0.0262, "step": 27300 }, { "epoch": 0.3, "learning_rate": 0.000255714471038464, "loss": 0.0222, "step": 27310 }, { "epoch": 0.3, "learning_rate": 0.0002556982551728611, "loss": 0.0232, "step": 27320 }, { "epoch": 0.3, "learning_rate": 0.0002556820393072582, "loss": 0.0246, "step": 27330 }, { "epoch": 0.3, "learning_rate": 0.0002556658234416553, "loss": 0.0257, "step": 27340 }, { "epoch": 0.3, "learning_rate": 0.0002556496075760524, "loss": 0.0235, "step": 27350 }, { "epoch": 0.3, "learning_rate": 0.0002556333917104495, "loss": 0.0239, "step": 27360 }, { "epoch": 0.3, "learning_rate": 0.0002556171758448466, "loss": 0.0233, "step": 27370 }, { "epoch": 0.3, "learning_rate": 0.00025560095997924365, "loss": 0.0227, "step": 27380 }, { "epoch": 0.3, "learning_rate": 0.00025558474411364077, "loss": 0.0265, "step": 27390 }, { "epoch": 0.3, "learning_rate": 0.0002555685282480379, "loss": 0.0242, "step": 27400 }, { "epoch": 0.3, "learning_rate": 0.00025555231238243495, "loss": 0.0227, "step": 27410 }, { "epoch": 0.3, "learning_rate": 0.00025553609651683207, "loss": 0.0225, "step": 27420 }, { "epoch": 0.3, "learning_rate": 0.00025551988065122914, "loss": 0.0227, "step": 27430 }, { "epoch": 0.3, "learning_rate": 0.00025550366478562626, "loss": 0.0249, "step": 27440 }, { "epoch": 0.3, "learning_rate": 0.0002554874489200233, "loss": 0.0255, "step": 27450 }, { "epoch": 0.3, "learning_rate": 0.00025547123305442044, "loss": 0.0302, "step": 27460 }, { "epoch": 0.3, "learning_rate": 0.0002554550171888175, "loss": 0.024, "step": 27470 }, { "epoch": 0.3, "learning_rate": 0.00025543880132321463, "loss": 0.0228, "step": 27480 }, { "epoch": 0.3, "learning_rate": 0.0002554225854576117, "loss": 0.0266, "step": 27490 }, { "epoch": 0.3, "learning_rate": 0.0002554063695920088, "loss": 0.0254, "step": 27500 }, { "epoch": 0.3, "learning_rate": 0.0002553901537264059, "loss": 0.0244, "step": 27510 }, { "epoch": 0.3, "learning_rate": 0.000255373937860803, "loss": 0.0232, "step": 27520 }, { "epoch": 0.3, "learning_rate": 0.00025535772199520006, "loss": 0.029, "step": 27530 }, { "epoch": 0.3, "learning_rate": 0.0002553415061295972, "loss": 0.027, "step": 27540 }, { "epoch": 0.3, "learning_rate": 0.00025532529026399425, "loss": 0.0252, "step": 27550 }, { "epoch": 0.3, "learning_rate": 0.00025530907439839137, "loss": 0.0227, "step": 27560 }, { "epoch": 0.3, "learning_rate": 0.00025529285853278844, "loss": 0.0267, "step": 27570 }, { "epoch": 0.3, "learning_rate": 0.00025527664266718555, "loss": 0.0244, "step": 27580 }, { "epoch": 0.3, "learning_rate": 0.0002552604268015827, "loss": 0.0238, "step": 27590 }, { "epoch": 0.3, "learning_rate": 0.00025524421093597974, "loss": 0.0246, "step": 27600 }, { "epoch": 0.3, "learning_rate": 0.0002552279950703768, "loss": 0.025, "step": 27610 }, { "epoch": 0.3, "learning_rate": 0.0002552117792047739, "loss": 0.0227, "step": 27620 }, { "epoch": 0.3, "learning_rate": 0.00025519556333917105, "loss": 0.0232, "step": 27630 }, { "epoch": 0.3, "learning_rate": 0.0002551793474735681, "loss": 0.0238, "step": 27640 }, { "epoch": 0.3, "learning_rate": 0.0002551631316079652, "loss": 0.0234, "step": 27650 }, { "epoch": 0.3, "learning_rate": 0.0002551469157423623, "loss": 0.0238, "step": 27660 }, { "epoch": 0.3, "learning_rate": 0.0002551306998767594, "loss": 0.024, "step": 27670 }, { "epoch": 0.3, "learning_rate": 0.0002551144840111565, "loss": 0.0281, "step": 27680 }, { "epoch": 0.3, "learning_rate": 0.00025509826814555355, "loss": 0.0207, "step": 27690 }, { "epoch": 0.3, "learning_rate": 0.00025508205227995067, "loss": 0.0234, "step": 27700 }, { "epoch": 0.3, "learning_rate": 0.0002550658364143478, "loss": 0.0245, "step": 27710 }, { "epoch": 0.3, "learning_rate": 0.0002550496205487449, "loss": 0.0264, "step": 27720 }, { "epoch": 0.3, "learning_rate": 0.000255033404683142, "loss": 0.026, "step": 27730 }, { "epoch": 0.3, "learning_rate": 0.00025501718881753904, "loss": 0.0231, "step": 27740 }, { "epoch": 0.3, "learning_rate": 0.00025500097295193616, "loss": 0.0187, "step": 27750 }, { "epoch": 0.3, "learning_rate": 0.0002549847570863333, "loss": 0.0244, "step": 27760 }, { "epoch": 0.3, "learning_rate": 0.00025496854122073034, "loss": 0.0238, "step": 27770 }, { "epoch": 0.3, "learning_rate": 0.0002549523253551274, "loss": 0.0228, "step": 27780 }, { "epoch": 0.3, "learning_rate": 0.00025493610948952453, "loss": 0.022, "step": 27790 }, { "epoch": 0.3, "learning_rate": 0.00025491989362392165, "loss": 0.0254, "step": 27800 }, { "epoch": 0.3, "learning_rate": 0.0002549036777583187, "loss": 0.0215, "step": 27810 }, { "epoch": 0.3, "learning_rate": 0.0002548874618927158, "loss": 0.0284, "step": 27820 }, { "epoch": 0.3, "learning_rate": 0.0002548712460271129, "loss": 0.0236, "step": 27830 }, { "epoch": 0.3, "learning_rate": 0.00025485503016151, "loss": 0.0243, "step": 27840 }, { "epoch": 0.3, "learning_rate": 0.0002548388142959071, "loss": 0.0248, "step": 27850 }, { "epoch": 0.3, "learning_rate": 0.0002548225984303042, "loss": 0.0246, "step": 27860 }, { "epoch": 0.3, "learning_rate": 0.00025480638256470127, "loss": 0.0272, "step": 27870 }, { "epoch": 0.3, "learning_rate": 0.0002547901666990984, "loss": 0.0238, "step": 27880 }, { "epoch": 0.3, "learning_rate": 0.00025477395083349546, "loss": 0.0222, "step": 27890 }, { "epoch": 0.3, "learning_rate": 0.0002547577349678926, "loss": 0.0243, "step": 27900 }, { "epoch": 0.3, "learning_rate": 0.00025474151910228964, "loss": 0.0211, "step": 27910 }, { "epoch": 0.3, "learning_rate": 0.00025472530323668676, "loss": 0.0344, "step": 27920 }, { "epoch": 0.3, "learning_rate": 0.00025470908737108383, "loss": 0.0302, "step": 27930 }, { "epoch": 0.3, "learning_rate": 0.00025469287150548095, "loss": 0.0305, "step": 27940 }, { "epoch": 0.3, "learning_rate": 0.000254676655639878, "loss": 0.0264, "step": 27950 }, { "epoch": 0.3, "learning_rate": 0.00025466043977427513, "loss": 0.0285, "step": 27960 }, { "epoch": 0.3, "learning_rate": 0.0002546442239086722, "loss": 0.027, "step": 27970 }, { "epoch": 0.3, "learning_rate": 0.0002546280080430693, "loss": 0.0242, "step": 27980 }, { "epoch": 0.3, "learning_rate": 0.00025461179217746644, "loss": 0.0231, "step": 27990 }, { "epoch": 0.3, "learning_rate": 0.0002545955763118635, "loss": 0.0258, "step": 28000 }, { "epoch": 0.3, "eval_cer": 0.9215990285544536, "eval_loss": 0.01768692582845688, "eval_runtime": 120.5374, "eval_samples_per_second": 16.592, "eval_steps_per_second": 4.148, "step": 28000 }, { "epoch": 0.3, "learning_rate": 0.00025457936044626057, "loss": 0.0224, "step": 28010 }, { "epoch": 0.3, "learning_rate": 0.0002545631445806577, "loss": 0.0234, "step": 28020 }, { "epoch": 0.3, "learning_rate": 0.0002545469287150548, "loss": 0.0229, "step": 28030 }, { "epoch": 0.3, "learning_rate": 0.0002545307128494519, "loss": 0.0302, "step": 28040 }, { "epoch": 0.3, "learning_rate": 0.00025451449698384894, "loss": 0.027, "step": 28050 }, { "epoch": 0.3, "learning_rate": 0.00025449828111824606, "loss": 0.0256, "step": 28060 }, { "epoch": 0.3, "learning_rate": 0.0002544820652526432, "loss": 0.024, "step": 28070 }, { "epoch": 0.3, "learning_rate": 0.00025446584938704025, "loss": 0.0242, "step": 28080 }, { "epoch": 0.3, "learning_rate": 0.00025444963352143737, "loss": 0.0275, "step": 28090 }, { "epoch": 0.3, "learning_rate": 0.00025443341765583443, "loss": 0.0264, "step": 28100 }, { "epoch": 0.3, "learning_rate": 0.00025441720179023155, "loss": 0.0206, "step": 28110 }, { "epoch": 0.3, "learning_rate": 0.0002544009859246286, "loss": 0.0263, "step": 28120 }, { "epoch": 0.3, "learning_rate": 0.00025438477005902574, "loss": 0.0239, "step": 28130 }, { "epoch": 0.3, "learning_rate": 0.0002543685541934228, "loss": 0.0221, "step": 28140 }, { "epoch": 0.3, "learning_rate": 0.0002543523383278199, "loss": 0.0245, "step": 28150 }, { "epoch": 0.3, "learning_rate": 0.00025433612246221704, "loss": 0.0232, "step": 28160 }, { "epoch": 0.3, "learning_rate": 0.0002543199065966141, "loss": 0.0194, "step": 28170 }, { "epoch": 0.3, "learning_rate": 0.0002543036907310112, "loss": 0.0218, "step": 28180 }, { "epoch": 0.3, "learning_rate": 0.0002542874748654083, "loss": 0.0199, "step": 28190 }, { "epoch": 0.3, "learning_rate": 0.0002542712589998054, "loss": 0.0292, "step": 28200 }, { "epoch": 0.3, "learning_rate": 0.0002542550431342025, "loss": 0.0257, "step": 28210 }, { "epoch": 0.31, "learning_rate": 0.00025423882726859954, "loss": 0.0268, "step": 28220 }, { "epoch": 0.31, "learning_rate": 0.00025422261140299666, "loss": 0.0231, "step": 28230 }, { "epoch": 0.31, "learning_rate": 0.0002542063955373938, "loss": 0.022, "step": 28240 }, { "epoch": 0.31, "learning_rate": 0.00025419017967179085, "loss": 0.0302, "step": 28250 }, { "epoch": 0.31, "learning_rate": 0.0002541739638061879, "loss": 0.0251, "step": 28260 }, { "epoch": 0.31, "learning_rate": 0.00025415774794058504, "loss": 0.0253, "step": 28270 }, { "epoch": 0.31, "learning_rate": 0.00025414153207498216, "loss": 0.0231, "step": 28280 }, { "epoch": 0.31, "learning_rate": 0.0002541253162093793, "loss": 0.0259, "step": 28290 }, { "epoch": 0.31, "learning_rate": 0.00025410910034377634, "loss": 0.0208, "step": 28300 }, { "epoch": 0.31, "learning_rate": 0.0002540928844781734, "loss": 0.0217, "step": 28310 }, { "epoch": 0.31, "learning_rate": 0.0002540766686125705, "loss": 0.0226, "step": 28320 }, { "epoch": 0.31, "learning_rate": 0.00025406045274696765, "loss": 0.0217, "step": 28330 }, { "epoch": 0.31, "learning_rate": 0.0002540442368813647, "loss": 0.0221, "step": 28340 }, { "epoch": 0.31, "learning_rate": 0.0002540280210157618, "loss": 0.0255, "step": 28350 }, { "epoch": 0.31, "learning_rate": 0.0002540118051501589, "loss": 0.0233, "step": 28360 }, { "epoch": 0.31, "learning_rate": 0.000253995589284556, "loss": 0.0213, "step": 28370 }, { "epoch": 0.31, "learning_rate": 0.0002539793734189531, "loss": 0.0238, "step": 28380 }, { "epoch": 0.31, "learning_rate": 0.00025396315755335015, "loss": 0.0194, "step": 28390 }, { "epoch": 0.31, "learning_rate": 0.00025394694168774727, "loss": 0.024, "step": 28400 }, { "epoch": 0.31, "learning_rate": 0.0002539307258221444, "loss": 0.0213, "step": 28410 }, { "epoch": 0.31, "learning_rate": 0.00025391450995654145, "loss": 0.0203, "step": 28420 }, { "epoch": 0.31, "learning_rate": 0.0002538982940909386, "loss": 0.0223, "step": 28430 }, { "epoch": 0.31, "learning_rate": 0.00025388207822533564, "loss": 0.019, "step": 28440 }, { "epoch": 0.31, "learning_rate": 0.00025386586235973276, "loss": 0.0208, "step": 28450 }, { "epoch": 0.31, "learning_rate": 0.0002538496464941298, "loss": 0.0228, "step": 28460 }, { "epoch": 0.31, "learning_rate": 0.00025383343062852694, "loss": 0.0227, "step": 28470 }, { "epoch": 0.31, "learning_rate": 0.000253817214762924, "loss": 0.0239, "step": 28480 }, { "epoch": 0.31, "learning_rate": 0.00025380099889732113, "loss": 0.0243, "step": 28490 }, { "epoch": 0.31, "learning_rate": 0.0002537847830317182, "loss": 0.0226, "step": 28500 }, { "epoch": 0.31, "learning_rate": 0.0002537685671661153, "loss": 0.0222, "step": 28510 }, { "epoch": 0.31, "learning_rate": 0.0002537523513005124, "loss": 0.021, "step": 28520 }, { "epoch": 0.31, "learning_rate": 0.0002537361354349095, "loss": 0.0228, "step": 28530 }, { "epoch": 0.31, "learning_rate": 0.00025371991956930657, "loss": 0.0229, "step": 28540 }, { "epoch": 0.31, "learning_rate": 0.0002537037037037037, "loss": 0.0253, "step": 28550 }, { "epoch": 0.31, "learning_rate": 0.00025368748783810075, "loss": 0.0227, "step": 28560 }, { "epoch": 0.31, "learning_rate": 0.00025367127197249787, "loss": 0.025, "step": 28570 }, { "epoch": 0.31, "learning_rate": 0.00025365505610689494, "loss": 0.0224, "step": 28580 }, { "epoch": 0.31, "learning_rate": 0.00025363884024129206, "loss": 0.0257, "step": 28590 }, { "epoch": 0.31, "learning_rate": 0.0002536226243756892, "loss": 0.0244, "step": 28600 }, { "epoch": 0.31, "learning_rate": 0.00025360640851008624, "loss": 0.0219, "step": 28610 }, { "epoch": 0.31, "learning_rate": 0.0002535901926444833, "loss": 0.0239, "step": 28620 }, { "epoch": 0.31, "learning_rate": 0.00025357397677888043, "loss": 0.022, "step": 28630 }, { "epoch": 0.31, "learning_rate": 0.00025355776091327755, "loss": 0.0272, "step": 28640 }, { "epoch": 0.31, "learning_rate": 0.0002535415450476746, "loss": 0.0231, "step": 28650 }, { "epoch": 0.31, "learning_rate": 0.0002535253291820717, "loss": 0.0249, "step": 28660 }, { "epoch": 0.31, "learning_rate": 0.0002535091133164688, "loss": 0.0235, "step": 28670 }, { "epoch": 0.31, "learning_rate": 0.0002534928974508659, "loss": 0.023, "step": 28680 }, { "epoch": 0.31, "learning_rate": 0.000253476681585263, "loss": 0.0306, "step": 28690 }, { "epoch": 0.31, "learning_rate": 0.00025346046571966005, "loss": 0.0278, "step": 28700 }, { "epoch": 0.31, "learning_rate": 0.00025344424985405717, "loss": 0.0238, "step": 28710 }, { "epoch": 0.31, "learning_rate": 0.0002534280339884543, "loss": 0.026, "step": 28720 }, { "epoch": 0.31, "learning_rate": 0.0002534118181228514, "loss": 0.0243, "step": 28730 }, { "epoch": 0.31, "learning_rate": 0.0002533956022572485, "loss": 0.0237, "step": 28740 }, { "epoch": 0.31, "learning_rate": 0.00025337938639164554, "loss": 0.029, "step": 28750 }, { "epoch": 0.31, "learning_rate": 0.00025336317052604266, "loss": 0.0206, "step": 28760 }, { "epoch": 0.31, "learning_rate": 0.0002533469546604398, "loss": 0.0276, "step": 28770 }, { "epoch": 0.31, "learning_rate": 0.00025333073879483685, "loss": 0.0289, "step": 28780 }, { "epoch": 0.31, "learning_rate": 0.0002533145229292339, "loss": 0.0208, "step": 28790 }, { "epoch": 0.31, "learning_rate": 0.00025329830706363103, "loss": 0.0228, "step": 28800 }, { "epoch": 0.31, "learning_rate": 0.00025328209119802815, "loss": 0.0253, "step": 28810 }, { "epoch": 0.31, "learning_rate": 0.0002532658753324252, "loss": 0.02, "step": 28820 }, { "epoch": 0.31, "learning_rate": 0.0002532496594668223, "loss": 0.0223, "step": 28830 }, { "epoch": 0.31, "learning_rate": 0.0002532334436012194, "loss": 0.0265, "step": 28840 }, { "epoch": 0.31, "learning_rate": 0.0002532172277356165, "loss": 0.0283, "step": 28850 }, { "epoch": 0.31, "learning_rate": 0.0002532010118700136, "loss": 0.0247, "step": 28860 }, { "epoch": 0.31, "learning_rate": 0.0002531847960044107, "loss": 0.0241, "step": 28870 }, { "epoch": 0.31, "learning_rate": 0.0002531685801388078, "loss": 0.024, "step": 28880 }, { "epoch": 0.31, "learning_rate": 0.0002531523642732049, "loss": 0.0229, "step": 28890 }, { "epoch": 0.31, "learning_rate": 0.000253136148407602, "loss": 0.0226, "step": 28900 }, { "epoch": 0.31, "learning_rate": 0.0002531199325419991, "loss": 0.0231, "step": 28910 }, { "epoch": 0.31, "learning_rate": 0.00025310371667639615, "loss": 0.0211, "step": 28920 }, { "epoch": 0.31, "learning_rate": 0.00025308750081079326, "loss": 0.0226, "step": 28930 }, { "epoch": 0.31, "learning_rate": 0.0002530712849451904, "loss": 0.0237, "step": 28940 }, { "epoch": 0.31, "learning_rate": 0.00025305506907958745, "loss": 0.0249, "step": 28950 }, { "epoch": 0.31, "learning_rate": 0.0002530388532139845, "loss": 0.0279, "step": 28960 }, { "epoch": 0.31, "learning_rate": 0.00025302263734838164, "loss": 0.0246, "step": 28970 }, { "epoch": 0.31, "learning_rate": 0.00025300642148277876, "loss": 0.0193, "step": 28980 }, { "epoch": 0.31, "learning_rate": 0.0002529902056171758, "loss": 0.0246, "step": 28990 }, { "epoch": 0.31, "learning_rate": 0.0002529739897515729, "loss": 0.0235, "step": 29000 }, { "epoch": 0.31, "eval_cer": 0.9215694960539368, "eval_loss": 0.01686452515423298, "eval_runtime": 121.6905, "eval_samples_per_second": 16.435, "eval_steps_per_second": 4.109, "step": 29000 }, { "epoch": 0.31, "learning_rate": 0.00025295777388597, "loss": 0.0236, "step": 29010 }, { "epoch": 0.31, "learning_rate": 0.0002529415580203671, "loss": 0.0204, "step": 29020 }, { "epoch": 0.31, "learning_rate": 0.0002529253421547642, "loss": 0.024, "step": 29030 }, { "epoch": 0.31, "learning_rate": 0.0002529091262891613, "loss": 0.0247, "step": 29040 }, { "epoch": 0.31, "learning_rate": 0.0002528929104235584, "loss": 0.0236, "step": 29050 }, { "epoch": 0.31, "learning_rate": 0.0002528766945579555, "loss": 0.0209, "step": 29060 }, { "epoch": 0.31, "learning_rate": 0.00025286047869235256, "loss": 0.023, "step": 29070 }, { "epoch": 0.31, "learning_rate": 0.0002528442628267497, "loss": 0.0229, "step": 29080 }, { "epoch": 0.31, "learning_rate": 0.00025282804696114675, "loss": 0.0197, "step": 29090 }, { "epoch": 0.31, "learning_rate": 0.00025281183109554387, "loss": 0.0234, "step": 29100 }, { "epoch": 0.31, "learning_rate": 0.00025279561522994093, "loss": 0.0227, "step": 29110 }, { "epoch": 0.31, "learning_rate": 0.00025277939936433805, "loss": 0.0204, "step": 29120 }, { "epoch": 0.31, "learning_rate": 0.0002527631834987351, "loss": 0.024, "step": 29130 }, { "epoch": 0.32, "learning_rate": 0.00025274696763313224, "loss": 0.0214, "step": 29140 }, { "epoch": 0.32, "learning_rate": 0.0002527307517675293, "loss": 0.0235, "step": 29150 }, { "epoch": 0.32, "learning_rate": 0.0002527145359019264, "loss": 0.0208, "step": 29160 }, { "epoch": 0.32, "learning_rate": 0.00025269832003632355, "loss": 0.0229, "step": 29170 }, { "epoch": 0.32, "learning_rate": 0.0002526821041707206, "loss": 0.0262, "step": 29180 }, { "epoch": 0.32, "learning_rate": 0.0002526658883051177, "loss": 0.0243, "step": 29190 }, { "epoch": 0.32, "learning_rate": 0.0002526496724395148, "loss": 0.021, "step": 29200 }, { "epoch": 0.32, "learning_rate": 0.0002526334565739119, "loss": 0.0209, "step": 29210 }, { "epoch": 0.32, "learning_rate": 0.000252617240708309, "loss": 0.0252, "step": 29220 }, { "epoch": 0.32, "learning_rate": 0.00025260102484270605, "loss": 0.0231, "step": 29230 }, { "epoch": 0.32, "learning_rate": 0.00025258480897710317, "loss": 0.0228, "step": 29240 }, { "epoch": 0.32, "learning_rate": 0.0002525685931115003, "loss": 0.0241, "step": 29250 }, { "epoch": 0.32, "learning_rate": 0.00025255237724589735, "loss": 0.0229, "step": 29260 }, { "epoch": 0.32, "learning_rate": 0.0002525361613802944, "loss": 0.0234, "step": 29270 }, { "epoch": 0.32, "learning_rate": 0.00025251994551469154, "loss": 0.022, "step": 29280 }, { "epoch": 0.32, "learning_rate": 0.00025250372964908866, "loss": 0.0234, "step": 29290 }, { "epoch": 0.32, "learning_rate": 0.0002524875137834858, "loss": 0.0225, "step": 29300 }, { "epoch": 0.32, "learning_rate": 0.00025247129791788284, "loss": 0.0217, "step": 29310 }, { "epoch": 0.32, "learning_rate": 0.0002524550820522799, "loss": 0.0253, "step": 29320 }, { "epoch": 0.32, "learning_rate": 0.00025243886618667703, "loss": 0.0198, "step": 29330 }, { "epoch": 0.32, "learning_rate": 0.00025242265032107415, "loss": 0.0283, "step": 29340 }, { "epoch": 0.32, "learning_rate": 0.0002524064344554712, "loss": 0.0262, "step": 29350 }, { "epoch": 0.32, "learning_rate": 0.0002523902185898683, "loss": 0.0259, "step": 29360 }, { "epoch": 0.32, "learning_rate": 0.0002523740027242654, "loss": 0.0261, "step": 29370 }, { "epoch": 0.32, "learning_rate": 0.0002523577868586625, "loss": 0.0219, "step": 29380 }, { "epoch": 0.32, "learning_rate": 0.0002523415709930596, "loss": 0.0257, "step": 29390 }, { "epoch": 0.32, "learning_rate": 0.00025232535512745665, "loss": 0.0225, "step": 29400 }, { "epoch": 0.32, "learning_rate": 0.00025230913926185377, "loss": 0.0264, "step": 29410 }, { "epoch": 0.32, "learning_rate": 0.0002522929233962509, "loss": 0.0252, "step": 29420 }, { "epoch": 0.32, "learning_rate": 0.00025227670753064796, "loss": 0.0259, "step": 29430 }, { "epoch": 0.32, "learning_rate": 0.0002522604916650451, "loss": 0.0263, "step": 29440 }, { "epoch": 0.32, "learning_rate": 0.00025224427579944214, "loss": 0.0268, "step": 29450 }, { "epoch": 0.32, "learning_rate": 0.00025222805993383926, "loss": 0.0236, "step": 29460 }, { "epoch": 0.32, "learning_rate": 0.00025221184406823633, "loss": 0.0212, "step": 29470 }, { "epoch": 0.32, "learning_rate": 0.00025219562820263345, "loss": 0.0223, "step": 29480 }, { "epoch": 0.32, "learning_rate": 0.0002521794123370305, "loss": 0.0262, "step": 29490 }, { "epoch": 0.32, "learning_rate": 0.00025216319647142763, "loss": 0.0242, "step": 29500 }, { "epoch": 0.32, "learning_rate": 0.00025214698060582475, "loss": 0.0245, "step": 29510 }, { "epoch": 0.32, "learning_rate": 0.0002521307647402218, "loss": 0.0253, "step": 29520 }, { "epoch": 0.32, "learning_rate": 0.0002521145488746189, "loss": 0.0236, "step": 29530 }, { "epoch": 0.32, "learning_rate": 0.000252098333009016, "loss": 0.0266, "step": 29540 }, { "epoch": 0.32, "learning_rate": 0.0002520821171434131, "loss": 0.0239, "step": 29550 }, { "epoch": 0.32, "learning_rate": 0.0002520659012778102, "loss": 0.02, "step": 29560 }, { "epoch": 0.32, "learning_rate": 0.00025204968541220725, "loss": 0.0233, "step": 29570 }, { "epoch": 0.32, "learning_rate": 0.0002520334695466044, "loss": 0.0213, "step": 29580 }, { "epoch": 0.32, "learning_rate": 0.0002520172536810015, "loss": 0.021, "step": 29590 }, { "epoch": 0.32, "learning_rate": 0.00025200103781539856, "loss": 0.0247, "step": 29600 }, { "epoch": 0.32, "learning_rate": 0.0002519848219497957, "loss": 0.0248, "step": 29610 }, { "epoch": 0.32, "learning_rate": 0.00025196860608419275, "loss": 0.0241, "step": 29620 }, { "epoch": 0.32, "learning_rate": 0.00025195239021858987, "loss": 0.0205, "step": 29630 }, { "epoch": 0.32, "learning_rate": 0.00025193617435298693, "loss": 0.0197, "step": 29640 }, { "epoch": 0.32, "learning_rate": 0.00025191995848738405, "loss": 0.0233, "step": 29650 }, { "epoch": 0.32, "learning_rate": 0.0002519037426217811, "loss": 0.0241, "step": 29660 }, { "epoch": 0.32, "learning_rate": 0.00025188752675617824, "loss": 0.0192, "step": 29670 }, { "epoch": 0.32, "learning_rate": 0.0002518713108905753, "loss": 0.0229, "step": 29680 }, { "epoch": 0.32, "learning_rate": 0.0002518550950249724, "loss": 0.0285, "step": 29690 }, { "epoch": 0.32, "learning_rate": 0.0002518388791593695, "loss": 0.023, "step": 29700 }, { "epoch": 0.32, "learning_rate": 0.0002518226632937666, "loss": 0.0237, "step": 29710 }, { "epoch": 0.32, "learning_rate": 0.0002518064474281637, "loss": 0.0265, "step": 29720 }, { "epoch": 0.32, "learning_rate": 0.0002517902315625608, "loss": 0.0227, "step": 29730 }, { "epoch": 0.32, "learning_rate": 0.0002517740156969579, "loss": 0.0285, "step": 29740 }, { "epoch": 0.32, "learning_rate": 0.000251757799831355, "loss": 0.0209, "step": 29750 }, { "epoch": 0.32, "learning_rate": 0.00025174158396575204, "loss": 0.022, "step": 29760 }, { "epoch": 0.32, "learning_rate": 0.00025172536810014916, "loss": 0.0222, "step": 29770 }, { "epoch": 0.32, "learning_rate": 0.0002517091522345463, "loss": 0.0248, "step": 29780 }, { "epoch": 0.32, "learning_rate": 0.00025169293636894335, "loss": 0.0295, "step": 29790 }, { "epoch": 0.32, "learning_rate": 0.0002516767205033404, "loss": 0.0279, "step": 29800 }, { "epoch": 0.32, "learning_rate": 0.00025166050463773753, "loss": 0.0229, "step": 29810 }, { "epoch": 0.32, "learning_rate": 0.00025164428877213465, "loss": 0.0222, "step": 29820 }, { "epoch": 0.32, "learning_rate": 0.0002516280729065317, "loss": 0.0251, "step": 29830 }, { "epoch": 0.32, "learning_rate": 0.0002516118570409288, "loss": 0.0237, "step": 29840 }, { "epoch": 0.32, "learning_rate": 0.0002515956411753259, "loss": 0.0264, "step": 29850 }, { "epoch": 0.32, "learning_rate": 0.000251579425309723, "loss": 0.0267, "step": 29860 }, { "epoch": 0.32, "learning_rate": 0.0002515632094441201, "loss": 0.0249, "step": 29870 }, { "epoch": 0.32, "learning_rate": 0.0002515469935785172, "loss": 0.0235, "step": 29880 }, { "epoch": 0.32, "learning_rate": 0.0002515307777129143, "loss": 0.0236, "step": 29890 }, { "epoch": 0.32, "learning_rate": 0.0002515145618473114, "loss": 0.0239, "step": 29900 }, { "epoch": 0.32, "learning_rate": 0.0002514983459817085, "loss": 0.023, "step": 29910 }, { "epoch": 0.32, "learning_rate": 0.0002514821301161056, "loss": 0.0282, "step": 29920 }, { "epoch": 0.32, "learning_rate": 0.00025146591425050265, "loss": 0.0281, "step": 29930 }, { "epoch": 0.32, "learning_rate": 0.00025144969838489977, "loss": 0.0252, "step": 29940 }, { "epoch": 0.32, "learning_rate": 0.0002514334825192969, "loss": 0.0278, "step": 29950 }, { "epoch": 0.32, "learning_rate": 0.00025141726665369395, "loss": 0.0237, "step": 29960 }, { "epoch": 0.32, "learning_rate": 0.000251401050788091, "loss": 0.0241, "step": 29970 }, { "epoch": 0.32, "learning_rate": 0.00025138483492248814, "loss": 0.0267, "step": 29980 }, { "epoch": 0.32, "learning_rate": 0.00025136861905688526, "loss": 0.0225, "step": 29990 }, { "epoch": 0.32, "learning_rate": 0.0002513524031912823, "loss": 0.0235, "step": 30000 }, { "epoch": 0.32, "eval_cer": 0.921567758848024, "eval_loss": 0.017599964514374733, "eval_runtime": 121.9748, "eval_samples_per_second": 16.397, "eval_steps_per_second": 4.099, "step": 30000 }, { "epoch": 0.32, "learning_rate": 0.0002513361873256794, "loss": 0.0246, "step": 30010 }, { "epoch": 0.32, "learning_rate": 0.0002513199714600765, "loss": 0.0224, "step": 30020 }, { "epoch": 0.32, "learning_rate": 0.00025130375559447363, "loss": 0.02, "step": 30030 }, { "epoch": 0.32, "learning_rate": 0.0002512875397288707, "loss": 0.0216, "step": 30040 }, { "epoch": 0.32, "learning_rate": 0.0002512713238632678, "loss": 0.0285, "step": 30050 }, { "epoch": 0.32, "learning_rate": 0.0002512551079976649, "loss": 0.021, "step": 30060 }, { "epoch": 0.33, "learning_rate": 0.000251238892132062, "loss": 0.019, "step": 30070 }, { "epoch": 0.33, "learning_rate": 0.00025122267626645907, "loss": 0.0263, "step": 30080 }, { "epoch": 0.33, "learning_rate": 0.0002512064604008562, "loss": 0.0234, "step": 30090 }, { "epoch": 0.33, "learning_rate": 0.00025119024453525325, "loss": 0.0274, "step": 30100 }, { "epoch": 0.33, "learning_rate": 0.00025117402866965037, "loss": 0.0233, "step": 30110 }, { "epoch": 0.33, "learning_rate": 0.00025115781280404744, "loss": 0.0223, "step": 30120 }, { "epoch": 0.33, "learning_rate": 0.00025114159693844456, "loss": 0.0236, "step": 30130 }, { "epoch": 0.33, "learning_rate": 0.0002511253810728416, "loss": 0.0221, "step": 30140 }, { "epoch": 0.33, "learning_rate": 0.00025110916520723874, "loss": 0.0243, "step": 30150 }, { "epoch": 0.33, "learning_rate": 0.0002510929493416358, "loss": 0.0211, "step": 30160 }, { "epoch": 0.33, "learning_rate": 0.00025107673347603293, "loss": 0.0277, "step": 30170 }, { "epoch": 0.33, "learning_rate": 0.00025106051761043005, "loss": 0.0247, "step": 30180 }, { "epoch": 0.33, "learning_rate": 0.0002510443017448271, "loss": 0.0238, "step": 30190 }, { "epoch": 0.33, "learning_rate": 0.0002510280858792242, "loss": 0.0274, "step": 30200 }, { "epoch": 0.33, "learning_rate": 0.0002510118700136213, "loss": 0.024, "step": 30210 }, { "epoch": 0.33, "learning_rate": 0.0002509956541480184, "loss": 0.0216, "step": 30220 }, { "epoch": 0.33, "learning_rate": 0.0002509794382824155, "loss": 0.0233, "step": 30230 }, { "epoch": 0.33, "learning_rate": 0.0002509632224168126, "loss": 0.0279, "step": 30240 }, { "epoch": 0.33, "learning_rate": 0.00025094700655120967, "loss": 0.0213, "step": 30250 }, { "epoch": 0.33, "learning_rate": 0.0002509307906856068, "loss": 0.0215, "step": 30260 }, { "epoch": 0.33, "learning_rate": 0.00025091457482000386, "loss": 0.0249, "step": 30270 }, { "epoch": 0.33, "learning_rate": 0.000250898358954401, "loss": 0.0257, "step": 30280 }, { "epoch": 0.33, "learning_rate": 0.00025088214308879804, "loss": 0.0213, "step": 30290 }, { "epoch": 0.33, "learning_rate": 0.00025086592722319516, "loss": 0.0271, "step": 30300 }, { "epoch": 0.33, "learning_rate": 0.0002508497113575923, "loss": 0.0262, "step": 30310 }, { "epoch": 0.33, "learning_rate": 0.00025083349549198935, "loss": 0.0265, "step": 30320 }, { "epoch": 0.33, "learning_rate": 0.0002508172796263864, "loss": 0.022, "step": 30330 }, { "epoch": 0.33, "learning_rate": 0.00025080106376078353, "loss": 0.0211, "step": 30340 }, { "epoch": 0.33, "learning_rate": 0.00025078484789518065, "loss": 0.0256, "step": 30350 }, { "epoch": 0.33, "learning_rate": 0.0002507686320295777, "loss": 0.0234, "step": 30360 }, { "epoch": 0.33, "learning_rate": 0.0002507524161639748, "loss": 0.0211, "step": 30370 }, { "epoch": 0.33, "learning_rate": 0.0002507362002983719, "loss": 0.0249, "step": 30380 }, { "epoch": 0.33, "learning_rate": 0.000250719984432769, "loss": 0.0239, "step": 30390 }, { "epoch": 0.33, "learning_rate": 0.0002507037685671661, "loss": 0.0248, "step": 30400 }, { "epoch": 0.33, "learning_rate": 0.00025068755270156315, "loss": 0.0215, "step": 30410 }, { "epoch": 0.33, "learning_rate": 0.0002506713368359603, "loss": 0.0217, "step": 30420 }, { "epoch": 0.33, "learning_rate": 0.0002506551209703574, "loss": 0.0238, "step": 30430 }, { "epoch": 0.33, "learning_rate": 0.00025063890510475446, "loss": 0.0232, "step": 30440 }, { "epoch": 0.33, "learning_rate": 0.0002506226892391516, "loss": 0.0223, "step": 30450 }, { "epoch": 0.33, "learning_rate": 0.00025060647337354864, "loss": 0.0228, "step": 30460 }, { "epoch": 0.33, "learning_rate": 0.00025059025750794576, "loss": 0.0248, "step": 30470 }, { "epoch": 0.33, "learning_rate": 0.0002505740416423429, "loss": 0.0241, "step": 30480 }, { "epoch": 0.33, "learning_rate": 0.00025055782577673995, "loss": 0.0263, "step": 30490 }, { "epoch": 0.33, "learning_rate": 0.000250541609911137, "loss": 0.0217, "step": 30500 }, { "epoch": 0.33, "learning_rate": 0.00025052539404553414, "loss": 0.0247, "step": 30510 }, { "epoch": 0.33, "learning_rate": 0.00025050917817993126, "loss": 0.02, "step": 30520 }, { "epoch": 0.33, "learning_rate": 0.0002504929623143283, "loss": 0.0244, "step": 30530 }, { "epoch": 0.33, "learning_rate": 0.0002504767464487254, "loss": 0.0248, "step": 30540 }, { "epoch": 0.33, "learning_rate": 0.0002504605305831225, "loss": 0.0241, "step": 30550 }, { "epoch": 0.33, "learning_rate": 0.0002504443147175196, "loss": 0.0223, "step": 30560 }, { "epoch": 0.33, "learning_rate": 0.0002504280988519167, "loss": 0.0235, "step": 30570 }, { "epoch": 0.33, "learning_rate": 0.00025041188298631376, "loss": 0.0203, "step": 30580 }, { "epoch": 0.33, "learning_rate": 0.0002503956671207109, "loss": 0.0212, "step": 30590 }, { "epoch": 0.33, "learning_rate": 0.000250379451255108, "loss": 0.0244, "step": 30600 }, { "epoch": 0.33, "learning_rate": 0.00025036323538950506, "loss": 0.0225, "step": 30610 }, { "epoch": 0.33, "learning_rate": 0.0002503470195239022, "loss": 0.023, "step": 30620 }, { "epoch": 0.33, "learning_rate": 0.00025033080365829925, "loss": 0.0247, "step": 30630 }, { "epoch": 0.33, "learning_rate": 0.00025031458779269637, "loss": 0.0249, "step": 30640 }, { "epoch": 0.33, "learning_rate": 0.00025029837192709343, "loss": 0.0289, "step": 30650 }, { "epoch": 0.33, "learning_rate": 0.00025028215606149055, "loss": 0.0242, "step": 30660 }, { "epoch": 0.33, "learning_rate": 0.0002502659401958876, "loss": 0.0245, "step": 30670 }, { "epoch": 0.33, "learning_rate": 0.00025024972433028474, "loss": 0.0249, "step": 30680 }, { "epoch": 0.33, "learning_rate": 0.0002502335084646818, "loss": 0.0184, "step": 30690 }, { "epoch": 0.33, "learning_rate": 0.0002502172925990789, "loss": 0.0227, "step": 30700 }, { "epoch": 0.33, "learning_rate": 0.000250201076733476, "loss": 0.0228, "step": 30710 }, { "epoch": 0.33, "learning_rate": 0.0002501848608678731, "loss": 0.0262, "step": 30720 }, { "epoch": 0.33, "learning_rate": 0.0002501686450022702, "loss": 0.0207, "step": 30730 }, { "epoch": 0.33, "learning_rate": 0.0002501524291366673, "loss": 0.0201, "step": 30740 }, { "epoch": 0.33, "learning_rate": 0.0002501362132710644, "loss": 0.0194, "step": 30750 }, { "epoch": 0.33, "learning_rate": 0.0002501199974054615, "loss": 0.0337, "step": 30760 }, { "epoch": 0.33, "learning_rate": 0.00025010378153985855, "loss": 0.0294, "step": 30770 }, { "epoch": 0.33, "learning_rate": 0.00025008756567425567, "loss": 0.0249, "step": 30780 }, { "epoch": 0.33, "learning_rate": 0.0002500713498086528, "loss": 0.0222, "step": 30790 }, { "epoch": 0.33, "learning_rate": 0.00025005513394304985, "loss": 0.0223, "step": 30800 }, { "epoch": 0.33, "learning_rate": 0.0002500389180774469, "loss": 0.0232, "step": 30810 }, { "epoch": 0.33, "learning_rate": 0.00025002270221184404, "loss": 0.0246, "step": 30820 }, { "epoch": 0.33, "learning_rate": 0.00025000648634624116, "loss": 0.0284, "step": 30830 }, { "epoch": 0.33, "learning_rate": 0.0002499902704806382, "loss": 0.0254, "step": 30840 }, { "epoch": 0.33, "learning_rate": 0.0002499740546150353, "loss": 0.0212, "step": 30850 }, { "epoch": 0.33, "learning_rate": 0.0002499578387494324, "loss": 0.0261, "step": 30860 }, { "epoch": 0.33, "learning_rate": 0.00024994162288382953, "loss": 0.0294, "step": 30870 }, { "epoch": 0.33, "learning_rate": 0.0002499254070182266, "loss": 0.0207, "step": 30880 }, { "epoch": 0.33, "learning_rate": 0.0002499091911526237, "loss": 0.0252, "step": 30890 }, { "epoch": 0.33, "learning_rate": 0.0002498929752870208, "loss": 0.0237, "step": 30900 }, { "epoch": 0.33, "learning_rate": 0.0002498767594214179, "loss": 0.0234, "step": 30910 }, { "epoch": 0.33, "learning_rate": 0.000249860543555815, "loss": 0.0208, "step": 30920 }, { "epoch": 0.33, "learning_rate": 0.0002498443276902121, "loss": 0.0234, "step": 30930 }, { "epoch": 0.33, "learning_rate": 0.00024982811182460915, "loss": 0.0235, "step": 30940 }, { "epoch": 0.33, "learning_rate": 0.00024981189595900627, "loss": 0.0232, "step": 30950 }, { "epoch": 0.33, "learning_rate": 0.0002497956800934034, "loss": 0.0235, "step": 30960 }, { "epoch": 0.33, "learning_rate": 0.00024977946422780046, "loss": 0.0239, "step": 30970 }, { "epoch": 0.33, "learning_rate": 0.0002497632483621975, "loss": 0.0221, "step": 30980 }, { "epoch": 0.34, "learning_rate": 0.00024974703249659464, "loss": 0.0241, "step": 30990 }, { "epoch": 0.34, "learning_rate": 0.00024973081663099176, "loss": 0.0223, "step": 31000 }, { "epoch": 0.34, "eval_cer": 0.92159989715741, "eval_loss": 0.01651957258582115, "eval_runtime": 121.4844, "eval_samples_per_second": 16.463, "eval_steps_per_second": 4.116, "step": 31000 }, { "epoch": 0.34, "learning_rate": 0.0002497146007653888, "loss": 0.0224, "step": 31010 }, { "epoch": 0.34, "learning_rate": 0.0002496983848997859, "loss": 0.0207, "step": 31020 }, { "epoch": 0.34, "learning_rate": 0.000249682169034183, "loss": 0.0226, "step": 31030 }, { "epoch": 0.34, "learning_rate": 0.00024966595316858013, "loss": 0.0219, "step": 31040 }, { "epoch": 0.34, "learning_rate": 0.00024964973730297725, "loss": 0.0226, "step": 31050 }, { "epoch": 0.34, "learning_rate": 0.0002496335214373743, "loss": 0.0221, "step": 31060 }, { "epoch": 0.34, "learning_rate": 0.0002496173055717714, "loss": 0.0184, "step": 31070 }, { "epoch": 0.34, "learning_rate": 0.0002496010897061685, "loss": 0.0215, "step": 31080 }, { "epoch": 0.34, "learning_rate": 0.0002495848738405656, "loss": 0.0216, "step": 31090 }, { "epoch": 0.34, "learning_rate": 0.0002495686579749627, "loss": 0.0281, "step": 31100 }, { "epoch": 0.34, "learning_rate": 0.00024955244210935975, "loss": 0.0219, "step": 31110 }, { "epoch": 0.34, "learning_rate": 0.0002495362262437569, "loss": 0.0261, "step": 31120 }, { "epoch": 0.34, "learning_rate": 0.000249520010378154, "loss": 0.0255, "step": 31130 }, { "epoch": 0.34, "learning_rate": 0.00024950379451255106, "loss": 0.0264, "step": 31140 }, { "epoch": 0.34, "learning_rate": 0.0002494875786469481, "loss": 0.0247, "step": 31150 }, { "epoch": 0.34, "learning_rate": 0.00024947136278134524, "loss": 0.0248, "step": 31160 }, { "epoch": 0.34, "learning_rate": 0.00024945514691574236, "loss": 0.0321, "step": 31170 }, { "epoch": 0.34, "learning_rate": 0.00024943893105013943, "loss": 0.0244, "step": 31180 }, { "epoch": 0.34, "learning_rate": 0.00024942271518453655, "loss": 0.0266, "step": 31190 }, { "epoch": 0.34, "learning_rate": 0.0002494064993189336, "loss": 0.023, "step": 31200 }, { "epoch": 0.34, "learning_rate": 0.00024939028345333074, "loss": 0.0238, "step": 31210 }, { "epoch": 0.34, "learning_rate": 0.0002493740675877278, "loss": 0.0194, "step": 31220 }, { "epoch": 0.34, "learning_rate": 0.0002493578517221249, "loss": 0.02, "step": 31230 }, { "epoch": 0.34, "learning_rate": 0.000249341635856522, "loss": 0.0227, "step": 31240 }, { "epoch": 0.34, "learning_rate": 0.0002493254199909191, "loss": 0.0253, "step": 31250 }, { "epoch": 0.34, "learning_rate": 0.00024930920412531617, "loss": 0.0218, "step": 31260 }, { "epoch": 0.34, "learning_rate": 0.0002492929882597133, "loss": 0.0266, "step": 31270 }, { "epoch": 0.34, "learning_rate": 0.00024927677239411036, "loss": 0.0227, "step": 31280 }, { "epoch": 0.34, "learning_rate": 0.0002492605565285075, "loss": 0.0262, "step": 31290 }, { "epoch": 0.34, "learning_rate": 0.00024924434066290454, "loss": 0.0231, "step": 31300 }, { "epoch": 0.34, "learning_rate": 0.00024922812479730166, "loss": 0.0232, "step": 31310 }, { "epoch": 0.34, "learning_rate": 0.0002492119089316988, "loss": 0.0218, "step": 31320 }, { "epoch": 0.34, "learning_rate": 0.00024919569306609585, "loss": 0.0194, "step": 31330 }, { "epoch": 0.34, "learning_rate": 0.0002491794772004929, "loss": 0.0277, "step": 31340 }, { "epoch": 0.34, "learning_rate": 0.00024916326133489003, "loss": 0.0198, "step": 31350 }, { "epoch": 0.34, "learning_rate": 0.00024914704546928715, "loss": 0.0209, "step": 31360 }, { "epoch": 0.34, "learning_rate": 0.0002491308296036842, "loss": 0.0188, "step": 31370 }, { "epoch": 0.34, "learning_rate": 0.0002491146137380813, "loss": 0.0211, "step": 31380 }, { "epoch": 0.34, "learning_rate": 0.0002490983978724784, "loss": 0.0255, "step": 31390 }, { "epoch": 0.34, "learning_rate": 0.0002490821820068755, "loss": 0.0222, "step": 31400 }, { "epoch": 0.34, "learning_rate": 0.0002490659661412726, "loss": 0.0262, "step": 31410 }, { "epoch": 0.34, "learning_rate": 0.00024904975027566966, "loss": 0.0219, "step": 31420 }, { "epoch": 0.34, "learning_rate": 0.0002490335344100668, "loss": 0.0213, "step": 31430 }, { "epoch": 0.34, "learning_rate": 0.0002490173185444639, "loss": 0.0221, "step": 31440 }, { "epoch": 0.34, "learning_rate": 0.00024900110267886096, "loss": 0.0435, "step": 31450 }, { "epoch": 0.34, "learning_rate": 0.0002489848868132581, "loss": 0.0214, "step": 31460 }, { "epoch": 0.34, "learning_rate": 0.00024896867094765515, "loss": 0.0214, "step": 31470 }, { "epoch": 0.34, "learning_rate": 0.00024895245508205227, "loss": 0.0237, "step": 31480 }, { "epoch": 0.34, "learning_rate": 0.0002489362392164494, "loss": 0.0207, "step": 31490 }, { "epoch": 0.34, "learning_rate": 0.00024892002335084645, "loss": 0.0238, "step": 31500 }, { "epoch": 0.34, "learning_rate": 0.0002489038074852435, "loss": 0.0212, "step": 31510 }, { "epoch": 0.34, "learning_rate": 0.00024888759161964064, "loss": 0.0211, "step": 31520 }, { "epoch": 0.34, "learning_rate": 0.00024887137575403776, "loss": 0.0219, "step": 31530 }, { "epoch": 0.34, "learning_rate": 0.0002488551598884348, "loss": 0.0257, "step": 31540 }, { "epoch": 0.34, "learning_rate": 0.0002488389440228319, "loss": 0.0266, "step": 31550 }, { "epoch": 0.34, "learning_rate": 0.000248822728157229, "loss": 0.0196, "step": 31560 }, { "epoch": 0.34, "learning_rate": 0.00024880651229162613, "loss": 0.0201, "step": 31570 }, { "epoch": 0.34, "learning_rate": 0.0002487902964260232, "loss": 0.0218, "step": 31580 }, { "epoch": 0.34, "learning_rate": 0.00024877408056042026, "loss": 0.0222, "step": 31590 }, { "epoch": 0.34, "learning_rate": 0.0002487578646948174, "loss": 0.0189, "step": 31600 }, { "epoch": 0.34, "learning_rate": 0.0002487416488292145, "loss": 0.0208, "step": 31610 }, { "epoch": 0.34, "learning_rate": 0.00024872543296361157, "loss": 0.0231, "step": 31620 }, { "epoch": 0.34, "learning_rate": 0.0002487092170980087, "loss": 0.0233, "step": 31630 }, { "epoch": 0.34, "learning_rate": 0.00024869300123240575, "loss": 0.022, "step": 31640 }, { "epoch": 0.34, "learning_rate": 0.00024867678536680287, "loss": 0.021, "step": 31650 }, { "epoch": 0.34, "learning_rate": 0.0002486605695012, "loss": 0.0196, "step": 31660 }, { "epoch": 0.34, "learning_rate": 0.00024864435363559706, "loss": 0.0187, "step": 31670 }, { "epoch": 0.34, "learning_rate": 0.0002486281377699941, "loss": 0.0208, "step": 31680 }, { "epoch": 0.34, "learning_rate": 0.00024861192190439124, "loss": 0.0213, "step": 31690 }, { "epoch": 0.34, "learning_rate": 0.00024859570603878836, "loss": 0.0208, "step": 31700 }, { "epoch": 0.34, "learning_rate": 0.00024857949017318543, "loss": 0.0196, "step": 31710 }, { "epoch": 0.34, "learning_rate": 0.0002485632743075825, "loss": 0.025, "step": 31720 }, { "epoch": 0.34, "learning_rate": 0.0002485470584419796, "loss": 0.0241, "step": 31730 }, { "epoch": 0.34, "learning_rate": 0.00024853084257637673, "loss": 0.0192, "step": 31740 }, { "epoch": 0.34, "learning_rate": 0.0002485146267107738, "loss": 0.0225, "step": 31750 }, { "epoch": 0.34, "learning_rate": 0.0002484984108451709, "loss": 0.0199, "step": 31760 }, { "epoch": 0.34, "learning_rate": 0.000248482194979568, "loss": 0.0225, "step": 31770 }, { "epoch": 0.34, "learning_rate": 0.0002484659791139651, "loss": 0.0256, "step": 31780 }, { "epoch": 0.34, "learning_rate": 0.00024844976324836217, "loss": 0.0233, "step": 31790 }, { "epoch": 0.34, "learning_rate": 0.0002484335473827593, "loss": 0.0433, "step": 31800 }, { "epoch": 0.34, "learning_rate": 0.00024841733151715635, "loss": 0.0341, "step": 31810 }, { "epoch": 0.34, "learning_rate": 0.0002484011156515535, "loss": 0.0204, "step": 31820 }, { "epoch": 0.34, "learning_rate": 0.00024838489978595054, "loss": 0.0215, "step": 31830 }, { "epoch": 0.34, "learning_rate": 0.00024836868392034766, "loss": 0.0257, "step": 31840 }, { "epoch": 0.34, "learning_rate": 0.0002483524680547447, "loss": 0.0258, "step": 31850 }, { "epoch": 0.34, "learning_rate": 0.00024833625218914185, "loss": 0.0263, "step": 31860 }, { "epoch": 0.34, "learning_rate": 0.0002483200363235389, "loss": 0.025, "step": 31870 }, { "epoch": 0.34, "learning_rate": 0.00024830382045793603, "loss": 0.026, "step": 31880 }, { "epoch": 0.34, "learning_rate": 0.0002482876045923331, "loss": 0.0276, "step": 31890 }, { "epoch": 0.34, "learning_rate": 0.0002482713887267302, "loss": 0.0263, "step": 31900 }, { "epoch": 0.34, "learning_rate": 0.0002482551728611273, "loss": 0.0322, "step": 31910 }, { "epoch": 0.35, "learning_rate": 0.0002482389569955244, "loss": 0.0224, "step": 31920 }, { "epoch": 0.35, "learning_rate": 0.0002482227411299215, "loss": 0.0223, "step": 31930 }, { "epoch": 0.35, "learning_rate": 0.0002482065252643186, "loss": 0.0247, "step": 31940 }, { "epoch": 0.35, "learning_rate": 0.00024819030939871565, "loss": 0.0209, "step": 31950 }, { "epoch": 0.35, "learning_rate": 0.00024817409353311277, "loss": 0.0237, "step": 31960 }, { "epoch": 0.35, "learning_rate": 0.0002481578776675099, "loss": 0.0257, "step": 31970 }, { "epoch": 0.35, "learning_rate": 0.00024814166180190696, "loss": 0.0233, "step": 31980 }, { "epoch": 0.35, "learning_rate": 0.000248125445936304, "loss": 0.0204, "step": 31990 }, { "epoch": 0.35, "learning_rate": 0.00024810923007070114, "loss": 0.0219, "step": 32000 }, { "epoch": 0.35, "eval_cer": 0.9215825250982824, "eval_loss": 0.016736265271902084, "eval_runtime": 121.554, "eval_samples_per_second": 16.454, "eval_steps_per_second": 4.113, "step": 32000 }, { "epoch": 0.35, "learning_rate": 0.00024809301420509826, "loss": 0.0264, "step": 32010 }, { "epoch": 0.35, "learning_rate": 0.00024807679833949533, "loss": 0.025, "step": 32020 }, { "epoch": 0.35, "learning_rate": 0.0002480605824738924, "loss": 0.022, "step": 32030 }, { "epoch": 0.35, "learning_rate": 0.0002480443666082895, "loss": 0.0244, "step": 32040 }, { "epoch": 0.35, "learning_rate": 0.00024802815074268663, "loss": 0.0212, "step": 32050 }, { "epoch": 0.35, "learning_rate": 0.00024801193487708375, "loss": 0.0234, "step": 32060 }, { "epoch": 0.35, "learning_rate": 0.0002479957190114808, "loss": 0.0208, "step": 32070 }, { "epoch": 0.35, "learning_rate": 0.0002479795031458779, "loss": 0.0227, "step": 32080 }, { "epoch": 0.35, "learning_rate": 0.000247963287280275, "loss": 0.0266, "step": 32090 }, { "epoch": 0.35, "learning_rate": 0.0002479470714146721, "loss": 0.0215, "step": 32100 }, { "epoch": 0.35, "learning_rate": 0.0002479308555490692, "loss": 0.0217, "step": 32110 }, { "epoch": 0.35, "learning_rate": 0.00024791463968346626, "loss": 0.0221, "step": 32120 }, { "epoch": 0.35, "learning_rate": 0.0002478984238178634, "loss": 0.0193, "step": 32130 }, { "epoch": 0.35, "learning_rate": 0.0002478822079522605, "loss": 0.0239, "step": 32140 }, { "epoch": 0.35, "learning_rate": 0.00024786599208665756, "loss": 0.023, "step": 32150 }, { "epoch": 0.35, "learning_rate": 0.00024784977622105463, "loss": 0.02, "step": 32160 }, { "epoch": 0.35, "learning_rate": 0.00024783356035545175, "loss": 0.0223, "step": 32170 }, { "epoch": 0.35, "learning_rate": 0.00024781734448984887, "loss": 0.0236, "step": 32180 }, { "epoch": 0.35, "learning_rate": 0.00024780112862424593, "loss": 0.0193, "step": 32190 }, { "epoch": 0.35, "learning_rate": 0.00024778491275864305, "loss": 0.0211, "step": 32200 }, { "epoch": 0.35, "learning_rate": 0.0002477686968930401, "loss": 0.023, "step": 32210 }, { "epoch": 0.35, "learning_rate": 0.00024775248102743724, "loss": 0.022, "step": 32220 }, { "epoch": 0.35, "learning_rate": 0.0002477362651618343, "loss": 0.0231, "step": 32230 }, { "epoch": 0.35, "learning_rate": 0.0002477200492962314, "loss": 0.0194, "step": 32240 }, { "epoch": 0.35, "learning_rate": 0.0002477038334306285, "loss": 0.0245, "step": 32250 }, { "epoch": 0.35, "learning_rate": 0.0002476876175650256, "loss": 0.021, "step": 32260 }, { "epoch": 0.35, "learning_rate": 0.0002476714016994227, "loss": 0.0243, "step": 32270 }, { "epoch": 0.35, "learning_rate": 0.0002476551858338198, "loss": 0.0252, "step": 32280 }, { "epoch": 0.35, "learning_rate": 0.00024763896996821686, "loss": 0.0268, "step": 32290 }, { "epoch": 0.35, "learning_rate": 0.000247622754102614, "loss": 0.0233, "step": 32300 }, { "epoch": 0.35, "learning_rate": 0.00024760653823701105, "loss": 0.0227, "step": 32310 }, { "epoch": 0.35, "learning_rate": 0.00024759032237140817, "loss": 0.0217, "step": 32320 }, { "epoch": 0.35, "learning_rate": 0.0002475741065058053, "loss": 0.0239, "step": 32330 }, { "epoch": 0.35, "learning_rate": 0.00024755789064020235, "loss": 0.0288, "step": 32340 }, { "epoch": 0.35, "learning_rate": 0.0002475416747745994, "loss": 0.0281, "step": 32350 }, { "epoch": 0.35, "learning_rate": 0.00024752545890899654, "loss": 0.0226, "step": 32360 }, { "epoch": 0.35, "learning_rate": 0.00024750924304339366, "loss": 0.0199, "step": 32370 }, { "epoch": 0.35, "learning_rate": 0.0002474930271777907, "loss": 0.0186, "step": 32380 }, { "epoch": 0.35, "learning_rate": 0.00024747681131218784, "loss": 0.0227, "step": 32390 }, { "epoch": 0.35, "learning_rate": 0.0002474605954465849, "loss": 0.0255, "step": 32400 }, { "epoch": 0.35, "learning_rate": 0.00024744437958098203, "loss": 0.0244, "step": 32410 }, { "epoch": 0.35, "learning_rate": 0.0002474281637153791, "loss": 0.0227, "step": 32420 }, { "epoch": 0.35, "learning_rate": 0.0002474119478497762, "loss": 0.0263, "step": 32430 }, { "epoch": 0.35, "learning_rate": 0.0002473957319841733, "loss": 0.0265, "step": 32440 }, { "epoch": 0.35, "learning_rate": 0.0002473795161185704, "loss": 0.0231, "step": 32450 }, { "epoch": 0.35, "learning_rate": 0.00024736330025296746, "loss": 0.0217, "step": 32460 }, { "epoch": 0.35, "learning_rate": 0.0002473470843873646, "loss": 0.0209, "step": 32470 }, { "epoch": 0.35, "learning_rate": 0.00024733086852176165, "loss": 0.0222, "step": 32480 }, { "epoch": 0.35, "learning_rate": 0.00024731465265615877, "loss": 0.0239, "step": 32490 }, { "epoch": 0.35, "learning_rate": 0.0002472984367905559, "loss": 0.025, "step": 32500 }, { "epoch": 0.35, "learning_rate": 0.00024728222092495296, "loss": 0.0268, "step": 32510 }, { "epoch": 0.35, "learning_rate": 0.00024726600505935, "loss": 0.027, "step": 32520 }, { "epoch": 0.35, "learning_rate": 0.00024724978919374714, "loss": 0.0247, "step": 32530 }, { "epoch": 0.35, "learning_rate": 0.00024723357332814426, "loss": 0.022, "step": 32540 }, { "epoch": 0.35, "learning_rate": 0.0002472173574625413, "loss": 0.0203, "step": 32550 }, { "epoch": 0.35, "learning_rate": 0.0002472011415969384, "loss": 0.023, "step": 32560 }, { "epoch": 0.35, "learning_rate": 0.0002471849257313355, "loss": 0.025, "step": 32570 }, { "epoch": 0.35, "learning_rate": 0.00024716870986573263, "loss": 0.025, "step": 32580 }, { "epoch": 0.35, "learning_rate": 0.0002471524940001297, "loss": 0.0239, "step": 32590 }, { "epoch": 0.35, "learning_rate": 0.00024713627813452676, "loss": 0.0221, "step": 32600 }, { "epoch": 0.35, "learning_rate": 0.0002471200622689239, "loss": 0.0199, "step": 32610 }, { "epoch": 0.35, "learning_rate": 0.000247103846403321, "loss": 0.0224, "step": 32620 }, { "epoch": 0.35, "learning_rate": 0.0002470876305377181, "loss": 0.0226, "step": 32630 }, { "epoch": 0.35, "learning_rate": 0.0002470714146721152, "loss": 0.0228, "step": 32640 }, { "epoch": 0.35, "learning_rate": 0.00024705519880651225, "loss": 0.0234, "step": 32650 }, { "epoch": 0.35, "learning_rate": 0.0002470389829409094, "loss": 0.0255, "step": 32660 }, { "epoch": 0.35, "learning_rate": 0.0002470227670753065, "loss": 0.0197, "step": 32670 }, { "epoch": 0.35, "learning_rate": 0.00024700655120970356, "loss": 0.0172, "step": 32680 }, { "epoch": 0.35, "learning_rate": 0.0002469903353441006, "loss": 0.0221, "step": 32690 }, { "epoch": 0.35, "learning_rate": 0.00024697411947849774, "loss": 0.0247, "step": 32700 }, { "epoch": 0.35, "learning_rate": 0.00024695790361289486, "loss": 0.0195, "step": 32710 }, { "epoch": 0.35, "learning_rate": 0.00024694168774729193, "loss": 0.0215, "step": 32720 }, { "epoch": 0.35, "learning_rate": 0.000246925471881689, "loss": 0.021, "step": 32730 }, { "epoch": 0.35, "learning_rate": 0.0002469092560160861, "loss": 0.0235, "step": 32740 }, { "epoch": 0.35, "learning_rate": 0.00024689304015048324, "loss": 0.0225, "step": 32750 }, { "epoch": 0.35, "learning_rate": 0.0002468768242848803, "loss": 0.0223, "step": 32760 }, { "epoch": 0.35, "learning_rate": 0.0002468606084192774, "loss": 0.0231, "step": 32770 }, { "epoch": 0.35, "learning_rate": 0.0002468443925536745, "loss": 0.0212, "step": 32780 }, { "epoch": 0.35, "learning_rate": 0.0002468281766880716, "loss": 0.021, "step": 32790 }, { "epoch": 0.35, "learning_rate": 0.00024681196082246867, "loss": 0.0197, "step": 32800 }, { "epoch": 0.35, "learning_rate": 0.0002467957449568658, "loss": 0.0218, "step": 32810 }, { "epoch": 0.35, "learning_rate": 0.00024677952909126286, "loss": 0.0214, "step": 32820 }, { "epoch": 0.35, "learning_rate": 0.00024676331322566, "loss": 0.0213, "step": 32830 }, { "epoch": 0.36, "learning_rate": 0.00024674709736005704, "loss": 0.0215, "step": 32840 }, { "epoch": 0.36, "learning_rate": 0.00024673088149445416, "loss": 0.0225, "step": 32850 }, { "epoch": 0.36, "learning_rate": 0.00024671466562885123, "loss": 0.0259, "step": 32860 }, { "epoch": 0.36, "learning_rate": 0.00024669844976324835, "loss": 0.0235, "step": 32870 }, { "epoch": 0.36, "learning_rate": 0.0002466822338976454, "loss": 0.0214, "step": 32880 }, { "epoch": 0.36, "learning_rate": 0.00024666601803204253, "loss": 0.0238, "step": 32890 }, { "epoch": 0.36, "learning_rate": 0.0002466498021664396, "loss": 0.0237, "step": 32900 }, { "epoch": 0.36, "learning_rate": 0.0002466335863008367, "loss": 0.0228, "step": 32910 }, { "epoch": 0.36, "learning_rate": 0.0002466173704352338, "loss": 0.0249, "step": 32920 }, { "epoch": 0.36, "learning_rate": 0.0002466011545696309, "loss": 0.0236, "step": 32930 }, { "epoch": 0.36, "learning_rate": 0.000246584938704028, "loss": 0.02, "step": 32940 }, { "epoch": 0.36, "learning_rate": 0.0002465687228384251, "loss": 0.0225, "step": 32950 }, { "epoch": 0.36, "learning_rate": 0.00024655250697282216, "loss": 0.021, "step": 32960 }, { "epoch": 0.36, "learning_rate": 0.0002465362911072193, "loss": 0.0203, "step": 32970 }, { "epoch": 0.36, "learning_rate": 0.0002465200752416164, "loss": 0.0202, "step": 32980 }, { "epoch": 0.36, "learning_rate": 0.00024650385937601346, "loss": 0.0193, "step": 32990 }, { "epoch": 0.36, "learning_rate": 0.0002464876435104105, "loss": 0.0214, "step": 33000 }, { "epoch": 0.36, "eval_cer": 0.921567758848024, "eval_loss": 0.01648101769387722, "eval_runtime": 121.6437, "eval_samples_per_second": 16.441, "eval_steps_per_second": 4.11, "step": 33000 }, { "epoch": 0.36, "learning_rate": 0.00024647142764480765, "loss": 0.0208, "step": 33010 }, { "epoch": 0.36, "learning_rate": 0.00024645521177920477, "loss": 0.0232, "step": 33020 }, { "epoch": 0.36, "learning_rate": 0.00024643899591360183, "loss": 0.0187, "step": 33030 }, { "epoch": 0.36, "learning_rate": 0.0002464227800479989, "loss": 0.0193, "step": 33040 }, { "epoch": 0.36, "learning_rate": 0.000246406564182396, "loss": 0.0227, "step": 33050 }, { "epoch": 0.36, "learning_rate": 0.00024639034831679314, "loss": 0.0225, "step": 33060 }, { "epoch": 0.36, "learning_rate": 0.00024637413245119026, "loss": 0.0233, "step": 33070 }, { "epoch": 0.36, "learning_rate": 0.0002463579165855873, "loss": 0.0241, "step": 33080 }, { "epoch": 0.36, "learning_rate": 0.0002463417007199844, "loss": 0.0267, "step": 33090 }, { "epoch": 0.36, "learning_rate": 0.0002463254848543815, "loss": 0.0251, "step": 33100 }, { "epoch": 0.36, "learning_rate": 0.00024630926898877863, "loss": 0.0314, "step": 33110 }, { "epoch": 0.36, "learning_rate": 0.0002462930531231757, "loss": 0.0331, "step": 33120 }, { "epoch": 0.36, "learning_rate": 0.00024627683725757276, "loss": 0.0293, "step": 33130 }, { "epoch": 0.36, "learning_rate": 0.0002462606213919699, "loss": 0.027, "step": 33140 }, { "epoch": 0.36, "learning_rate": 0.000246244405526367, "loss": 0.0267, "step": 33150 }, { "epoch": 0.36, "learning_rate": 0.00024622818966076406, "loss": 0.023, "step": 33160 }, { "epoch": 0.36, "learning_rate": 0.00024621197379516113, "loss": 0.0235, "step": 33170 }, { "epoch": 0.36, "learning_rate": 0.00024619575792955825, "loss": 0.0216, "step": 33180 }, { "epoch": 0.36, "learning_rate": 0.00024617954206395537, "loss": 0.0209, "step": 33190 }, { "epoch": 0.36, "learning_rate": 0.00024616332619835244, "loss": 0.0245, "step": 33200 }, { "epoch": 0.36, "learning_rate": 0.00024614711033274956, "loss": 0.0205, "step": 33210 }, { "epoch": 0.36, "learning_rate": 0.0002461308944671466, "loss": 0.0226, "step": 33220 }, { "epoch": 0.36, "learning_rate": 0.00024611467860154374, "loss": 0.0222, "step": 33230 }, { "epoch": 0.36, "learning_rate": 0.00024609846273594086, "loss": 0.023, "step": 33240 }, { "epoch": 0.36, "learning_rate": 0.0002460822468703379, "loss": 0.022, "step": 33250 }, { "epoch": 0.36, "learning_rate": 0.000246066031004735, "loss": 0.0208, "step": 33260 }, { "epoch": 0.36, "learning_rate": 0.0002460498151391321, "loss": 0.0223, "step": 33270 }, { "epoch": 0.36, "learning_rate": 0.00024603359927352923, "loss": 0.0233, "step": 33280 }, { "epoch": 0.36, "learning_rate": 0.0002460173834079263, "loss": 0.0245, "step": 33290 }, { "epoch": 0.36, "learning_rate": 0.00024600116754232336, "loss": 0.0195, "step": 33300 }, { "epoch": 0.36, "learning_rate": 0.0002459849516767205, "loss": 0.022, "step": 33310 }, { "epoch": 0.36, "learning_rate": 0.0002459687358111176, "loss": 0.0249, "step": 33320 }, { "epoch": 0.36, "learning_rate": 0.00024595251994551467, "loss": 0.0244, "step": 33330 }, { "epoch": 0.36, "learning_rate": 0.0002459363040799118, "loss": 0.0245, "step": 33340 }, { "epoch": 0.36, "learning_rate": 0.00024592008821430885, "loss": 0.0218, "step": 33350 }, { "epoch": 0.36, "learning_rate": 0.000245903872348706, "loss": 0.0227, "step": 33360 }, { "epoch": 0.36, "learning_rate": 0.00024588765648310304, "loss": 0.023, "step": 33370 }, { "epoch": 0.36, "learning_rate": 0.00024587144061750016, "loss": 0.0224, "step": 33380 }, { "epoch": 0.36, "learning_rate": 0.0002458552247518972, "loss": 0.019, "step": 33390 }, { "epoch": 0.36, "learning_rate": 0.00024583900888629434, "loss": 0.0236, "step": 33400 }, { "epoch": 0.36, "learning_rate": 0.0002458227930206914, "loss": 0.0245, "step": 33410 }, { "epoch": 0.36, "learning_rate": 0.00024580657715508853, "loss": 0.0221, "step": 33420 }, { "epoch": 0.36, "learning_rate": 0.0002457903612894856, "loss": 0.0277, "step": 33430 }, { "epoch": 0.36, "learning_rate": 0.0002457741454238827, "loss": 0.029, "step": 33440 }, { "epoch": 0.36, "learning_rate": 0.0002457579295582798, "loss": 0.025, "step": 33450 }, { "epoch": 0.36, "learning_rate": 0.0002457417136926769, "loss": 0.0217, "step": 33460 }, { "epoch": 0.36, "learning_rate": 0.00024572549782707397, "loss": 0.0232, "step": 33470 }, { "epoch": 0.36, "learning_rate": 0.0002457092819614711, "loss": 0.0231, "step": 33480 }, { "epoch": 0.36, "learning_rate": 0.00024569306609586815, "loss": 0.021, "step": 33490 }, { "epoch": 0.36, "learning_rate": 0.00024567685023026527, "loss": 0.0235, "step": 33500 }, { "epoch": 0.36, "learning_rate": 0.0002456606343646624, "loss": 0.0239, "step": 33510 }, { "epoch": 0.36, "learning_rate": 0.00024564441849905946, "loss": 0.0211, "step": 33520 }, { "epoch": 0.36, "learning_rate": 0.0002456282026334565, "loss": 0.0218, "step": 33530 }, { "epoch": 0.36, "learning_rate": 0.00024561198676785364, "loss": 0.0244, "step": 33540 }, { "epoch": 0.36, "learning_rate": 0.00024559577090225076, "loss": 0.0229, "step": 33550 }, { "epoch": 0.36, "learning_rate": 0.00024557955503664783, "loss": 0.0207, "step": 33560 }, { "epoch": 0.36, "learning_rate": 0.0002455633391710449, "loss": 0.0234, "step": 33570 }, { "epoch": 0.36, "learning_rate": 0.000245547123305442, "loss": 0.0225, "step": 33580 }, { "epoch": 0.36, "learning_rate": 0.00024553090743983913, "loss": 0.02, "step": 33590 }, { "epoch": 0.36, "learning_rate": 0.0002455146915742362, "loss": 0.0215, "step": 33600 }, { "epoch": 0.36, "learning_rate": 0.00024549847570863327, "loss": 0.019, "step": 33610 }, { "epoch": 0.36, "learning_rate": 0.0002454822598430304, "loss": 0.0201, "step": 33620 }, { "epoch": 0.36, "learning_rate": 0.0002454660439774275, "loss": 0.0231, "step": 33630 }, { "epoch": 0.36, "learning_rate": 0.0002454498281118246, "loss": 0.0218, "step": 33640 }, { "epoch": 0.36, "learning_rate": 0.0002454336122462217, "loss": 0.0271, "step": 33650 }, { "epoch": 0.36, "learning_rate": 0.00024541739638061876, "loss": 0.0204, "step": 33660 }, { "epoch": 0.36, "learning_rate": 0.0002454011805150159, "loss": 0.0236, "step": 33670 }, { "epoch": 0.36, "learning_rate": 0.000245384964649413, "loss": 0.0204, "step": 33680 }, { "epoch": 0.36, "learning_rate": 0.00024536874878381006, "loss": 0.0221, "step": 33690 }, { "epoch": 0.36, "learning_rate": 0.0002453525329182071, "loss": 0.0236, "step": 33700 }, { "epoch": 0.36, "learning_rate": 0.00024533631705260425, "loss": 0.0248, "step": 33710 }, { "epoch": 0.36, "learning_rate": 0.00024532010118700137, "loss": 0.0207, "step": 33720 }, { "epoch": 0.36, "learning_rate": 0.00024530388532139843, "loss": 0.022, "step": 33730 }, { "epoch": 0.36, "learning_rate": 0.0002452876694557955, "loss": 0.0228, "step": 33740 }, { "epoch": 0.36, "learning_rate": 0.0002452714535901926, "loss": 0.0192, "step": 33750 }, { "epoch": 0.36, "learning_rate": 0.00024525523772458974, "loss": 0.0209, "step": 33760 }, { "epoch": 0.37, "learning_rate": 0.0002452390218589868, "loss": 0.0213, "step": 33770 }, { "epoch": 0.37, "learning_rate": 0.0002452228059933839, "loss": 0.0237, "step": 33780 }, { "epoch": 0.37, "learning_rate": 0.000245206590127781, "loss": 0.0203, "step": 33790 }, { "epoch": 0.37, "learning_rate": 0.0002451903742621781, "loss": 0.0231, "step": 33800 }, { "epoch": 0.37, "learning_rate": 0.00024517415839657523, "loss": 0.0237, "step": 33810 }, { "epoch": 0.37, "learning_rate": 0.0002451579425309723, "loss": 0.0204, "step": 33820 }, { "epoch": 0.37, "learning_rate": 0.00024514172666536936, "loss": 0.0226, "step": 33830 }, { "epoch": 0.37, "learning_rate": 0.0002451255107997665, "loss": 0.0191, "step": 33840 }, { "epoch": 0.37, "learning_rate": 0.0002451092949341636, "loss": 0.0222, "step": 33850 }, { "epoch": 0.37, "learning_rate": 0.00024509307906856067, "loss": 0.0215, "step": 33860 }, { "epoch": 0.37, "learning_rate": 0.00024507686320295773, "loss": 0.0226, "step": 33870 }, { "epoch": 0.37, "learning_rate": 0.00024506064733735485, "loss": 0.0274, "step": 33880 }, { "epoch": 0.37, "learning_rate": 0.00024504443147175197, "loss": 0.019, "step": 33890 }, { "epoch": 0.37, "learning_rate": 0.00024502821560614904, "loss": 0.021, "step": 33900 }, { "epoch": 0.37, "learning_rate": 0.0002450119997405461, "loss": 0.0213, "step": 33910 }, { "epoch": 0.37, "learning_rate": 0.0002449957838749432, "loss": 0.0254, "step": 33920 }, { "epoch": 0.37, "learning_rate": 0.00024497956800934034, "loss": 0.0207, "step": 33930 }, { "epoch": 0.37, "learning_rate": 0.0002449633521437374, "loss": 0.0261, "step": 33940 }, { "epoch": 0.37, "learning_rate": 0.0002449471362781345, "loss": 0.0251, "step": 33950 }, { "epoch": 0.37, "learning_rate": 0.0002449309204125316, "loss": 0.0273, "step": 33960 }, { "epoch": 0.37, "learning_rate": 0.0002449147045469287, "loss": 0.0271, "step": 33970 }, { "epoch": 0.37, "learning_rate": 0.0002448984886813258, "loss": 0.0224, "step": 33980 }, { "epoch": 0.37, "learning_rate": 0.0002448822728157229, "loss": 0.0223, "step": 33990 }, { "epoch": 0.37, "learning_rate": 0.00024486605695011996, "loss": 0.0232, "step": 34000 }, { "epoch": 0.37, "eval_cer": 0.9215582042155038, "eval_loss": 0.016336919739842415, "eval_runtime": 121.6996, "eval_samples_per_second": 16.434, "eval_steps_per_second": 4.108, "step": 34000 }, { "epoch": 0.37, "learning_rate": 0.0002448498410845171, "loss": 0.0247, "step": 34010 }, { "epoch": 0.37, "learning_rate": 0.00024483362521891415, "loss": 0.0189, "step": 34020 }, { "epoch": 0.37, "learning_rate": 0.00024481740935331127, "loss": 0.0205, "step": 34030 }, { "epoch": 0.37, "learning_rate": 0.00024480119348770833, "loss": 0.0254, "step": 34040 }, { "epoch": 0.37, "learning_rate": 0.00024478497762210545, "loss": 0.024, "step": 34050 }, { "epoch": 0.37, "learning_rate": 0.0002447687617565025, "loss": 0.0241, "step": 34060 }, { "epoch": 0.37, "learning_rate": 0.00024475254589089964, "loss": 0.021, "step": 34070 }, { "epoch": 0.37, "learning_rate": 0.00024473633002529676, "loss": 0.0193, "step": 34080 }, { "epoch": 0.37, "learning_rate": 0.0002447201141596938, "loss": 0.0209, "step": 34090 }, { "epoch": 0.37, "learning_rate": 0.0002447038982940909, "loss": 0.0192, "step": 34100 }, { "epoch": 0.37, "learning_rate": 0.000244687682428488, "loss": 0.0181, "step": 34110 }, { "epoch": 0.37, "learning_rate": 0.00024467146656288513, "loss": 0.0199, "step": 34120 }, { "epoch": 0.37, "learning_rate": 0.0002446552506972822, "loss": 0.0188, "step": 34130 }, { "epoch": 0.37, "learning_rate": 0.00024463903483167926, "loss": 0.0246, "step": 34140 }, { "epoch": 0.37, "learning_rate": 0.0002446228189660764, "loss": 0.0212, "step": 34150 }, { "epoch": 0.37, "learning_rate": 0.0002446066031004735, "loss": 0.0198, "step": 34160 }, { "epoch": 0.37, "learning_rate": 0.00024459038723487057, "loss": 0.0176, "step": 34170 }, { "epoch": 0.37, "learning_rate": 0.00024457417136926763, "loss": 0.0194, "step": 34180 }, { "epoch": 0.37, "learning_rate": 0.00024455795550366475, "loss": 0.0216, "step": 34190 }, { "epoch": 0.37, "learning_rate": 0.00024454173963806187, "loss": 0.0252, "step": 34200 }, { "epoch": 0.37, "learning_rate": 0.00024452552377245894, "loss": 0.022, "step": 34210 }, { "epoch": 0.37, "learning_rate": 0.00024450930790685606, "loss": 0.0257, "step": 34220 }, { "epoch": 0.37, "learning_rate": 0.0002444930920412531, "loss": 0.0218, "step": 34230 }, { "epoch": 0.37, "learning_rate": 0.00024447687617565024, "loss": 0.0237, "step": 34240 }, { "epoch": 0.37, "learning_rate": 0.00024446066031004736, "loss": 0.0218, "step": 34250 }, { "epoch": 0.37, "learning_rate": 0.00024444444444444443, "loss": 0.025, "step": 34260 }, { "epoch": 0.37, "learning_rate": 0.0002444282285788415, "loss": 0.0198, "step": 34270 }, { "epoch": 0.37, "learning_rate": 0.0002444120127132386, "loss": 0.0203, "step": 34280 }, { "epoch": 0.37, "learning_rate": 0.00024439579684763573, "loss": 0.0237, "step": 34290 }, { "epoch": 0.37, "learning_rate": 0.0002443795809820328, "loss": 0.0275, "step": 34300 }, { "epoch": 0.37, "learning_rate": 0.00024436336511642987, "loss": 0.0194, "step": 34310 }, { "epoch": 0.37, "learning_rate": 0.000244347149250827, "loss": 0.0226, "step": 34320 }, { "epoch": 0.37, "learning_rate": 0.0002443309333852241, "loss": 0.021, "step": 34330 }, { "epoch": 0.37, "learning_rate": 0.00024431471751962117, "loss": 0.0231, "step": 34340 }, { "epoch": 0.37, "learning_rate": 0.0002442985016540183, "loss": 0.0193, "step": 34350 }, { "epoch": 0.37, "learning_rate": 0.00024428228578841536, "loss": 0.0188, "step": 34360 }, { "epoch": 0.37, "learning_rate": 0.0002442660699228125, "loss": 0.0204, "step": 34370 }, { "epoch": 0.37, "learning_rate": 0.00024424985405720954, "loss": 0.0218, "step": 34380 }, { "epoch": 0.37, "learning_rate": 0.00024423363819160666, "loss": 0.021, "step": 34390 }, { "epoch": 0.37, "learning_rate": 0.00024421742232600373, "loss": 0.0226, "step": 34400 }, { "epoch": 0.37, "learning_rate": 0.00024420120646040085, "loss": 0.0181, "step": 34410 }, { "epoch": 0.37, "learning_rate": 0.0002441849905947979, "loss": 0.0198, "step": 34420 }, { "epoch": 0.37, "learning_rate": 0.00024416877472919503, "loss": 0.0204, "step": 34430 }, { "epoch": 0.37, "learning_rate": 0.0002441525588635921, "loss": 0.0226, "step": 34440 }, { "epoch": 0.37, "learning_rate": 0.00024413634299798922, "loss": 0.0204, "step": 34450 }, { "epoch": 0.37, "learning_rate": 0.00024412012713238628, "loss": 0.0243, "step": 34460 }, { "epoch": 0.37, "learning_rate": 0.0002441039112667834, "loss": 0.0209, "step": 34470 }, { "epoch": 0.37, "learning_rate": 0.0002440876954011805, "loss": 0.0235, "step": 34480 }, { "epoch": 0.37, "learning_rate": 0.0002440714795355776, "loss": 0.0199, "step": 34490 }, { "epoch": 0.37, "learning_rate": 0.00024405526366997465, "loss": 0.0259, "step": 34500 }, { "epoch": 0.37, "learning_rate": 0.00024403904780437177, "loss": 0.0215, "step": 34510 }, { "epoch": 0.37, "learning_rate": 0.00024402283193876887, "loss": 0.0254, "step": 34520 }, { "epoch": 0.37, "learning_rate": 0.00024400661607316596, "loss": 0.0204, "step": 34530 }, { "epoch": 0.37, "learning_rate": 0.00024399040020756308, "loss": 0.0234, "step": 34540 }, { "epoch": 0.37, "learning_rate": 0.00024397418434196015, "loss": 0.0275, "step": 34550 }, { "epoch": 0.37, "learning_rate": 0.00024395796847635724, "loss": 0.0195, "step": 34560 }, { "epoch": 0.37, "learning_rate": 0.00024394175261075436, "loss": 0.0204, "step": 34570 }, { "epoch": 0.37, "learning_rate": 0.00024392553674515145, "loss": 0.0225, "step": 34580 }, { "epoch": 0.37, "learning_rate": 0.00024390932087954852, "loss": 0.0221, "step": 34590 }, { "epoch": 0.37, "learning_rate": 0.0002438931050139456, "loss": 0.0224, "step": 34600 }, { "epoch": 0.37, "learning_rate": 0.00024387688914834273, "loss": 0.025, "step": 34610 }, { "epoch": 0.37, "learning_rate": 0.00024386067328273982, "loss": 0.0232, "step": 34620 }, { "epoch": 0.37, "learning_rate": 0.0002438444574171369, "loss": 0.0199, "step": 34630 }, { "epoch": 0.37, "learning_rate": 0.000243828241551534, "loss": 0.0214, "step": 34640 }, { "epoch": 0.37, "learning_rate": 0.0002438120256859311, "loss": 0.0239, "step": 34650 }, { "epoch": 0.37, "learning_rate": 0.0002437958098203282, "loss": 0.022, "step": 34660 }, { "epoch": 0.37, "learning_rate": 0.00024377959395472526, "loss": 0.0216, "step": 34670 }, { "epoch": 0.37, "learning_rate": 0.00024376337808912238, "loss": 0.0231, "step": 34680 }, { "epoch": 0.38, "learning_rate": 0.00024374716222351947, "loss": 0.0237, "step": 34690 }, { "epoch": 0.38, "learning_rate": 0.0002437309463579166, "loss": 0.024, "step": 34700 }, { "epoch": 0.38, "learning_rate": 0.00024371473049231366, "loss": 0.0233, "step": 34710 }, { "epoch": 0.38, "learning_rate": 0.00024369851462671075, "loss": 0.0228, "step": 34720 }, { "epoch": 0.38, "learning_rate": 0.00024368229876110784, "loss": 0.0226, "step": 34730 }, { "epoch": 0.38, "learning_rate": 0.00024366608289550496, "loss": 0.0182, "step": 34740 }, { "epoch": 0.38, "learning_rate": 0.00024364986702990203, "loss": 0.0249, "step": 34750 }, { "epoch": 0.38, "learning_rate": 0.00024363365116429912, "loss": 0.0238, "step": 34760 }, { "epoch": 0.38, "learning_rate": 0.00024361743529869624, "loss": 0.0241, "step": 34770 }, { "epoch": 0.38, "learning_rate": 0.00024360121943309333, "loss": 0.0197, "step": 34780 }, { "epoch": 0.38, "learning_rate": 0.0002435850035674904, "loss": 0.0245, "step": 34790 }, { "epoch": 0.38, "learning_rate": 0.0002435687877018875, "loss": 0.0224, "step": 34800 }, { "epoch": 0.38, "learning_rate": 0.0002435525718362846, "loss": 0.0198, "step": 34810 }, { "epoch": 0.38, "learning_rate": 0.0002435363559706817, "loss": 0.0234, "step": 34820 }, { "epoch": 0.38, "learning_rate": 0.00024352014010507877, "loss": 0.0224, "step": 34830 }, { "epoch": 0.38, "learning_rate": 0.0002435039242394759, "loss": 0.021, "step": 34840 }, { "epoch": 0.38, "learning_rate": 0.00024348770837387298, "loss": 0.0211, "step": 34850 }, { "epoch": 0.38, "learning_rate": 0.00024347149250827007, "loss": 0.0233, "step": 34860 }, { "epoch": 0.38, "learning_rate": 0.00024345527664266714, "loss": 0.0259, "step": 34870 }, { "epoch": 0.38, "learning_rate": 0.00024343906077706426, "loss": 0.0265, "step": 34880 }, { "epoch": 0.38, "learning_rate": 0.00024342284491146135, "loss": 0.0223, "step": 34890 }, { "epoch": 0.38, "learning_rate": 0.00024340662904585845, "loss": 0.0221, "step": 34900 }, { "epoch": 0.38, "learning_rate": 0.00024339041318025554, "loss": 0.0217, "step": 34910 }, { "epoch": 0.38, "learning_rate": 0.00024337419731465263, "loss": 0.022, "step": 34920 }, { "epoch": 0.38, "learning_rate": 0.00024335798144904972, "loss": 0.0228, "step": 34930 }, { "epoch": 0.38, "learning_rate": 0.00024334176558344684, "loss": 0.0257, "step": 34940 }, { "epoch": 0.38, "learning_rate": 0.0002433255497178439, "loss": 0.0234, "step": 34950 }, { "epoch": 0.38, "learning_rate": 0.000243309333852241, "loss": 0.0201, "step": 34960 }, { "epoch": 0.38, "learning_rate": 0.0002432931179866381, "loss": 0.02, "step": 34970 }, { "epoch": 0.38, "learning_rate": 0.00024327690212103522, "loss": 0.0248, "step": 34980 }, { "epoch": 0.38, "learning_rate": 0.00024326068625543228, "loss": 0.0249, "step": 34990 }, { "epoch": 0.38, "learning_rate": 0.00024324447038982937, "loss": 0.0192, "step": 35000 }, { "epoch": 0.38, "eval_cer": 0.9215729704657623, "eval_loss": 0.016215071082115173, "eval_runtime": 121.5329, "eval_samples_per_second": 16.456, "eval_steps_per_second": 4.114, "step": 35000 }, { "epoch": 0.38, "learning_rate": 0.0002432282545242265, "loss": 0.0251, "step": 35010 }, { "epoch": 0.38, "learning_rate": 0.00024321203865862359, "loss": 0.0213, "step": 35020 }, { "epoch": 0.38, "learning_rate": 0.00024319582279302065, "loss": 0.0193, "step": 35030 }, { "epoch": 0.38, "learning_rate": 0.00024317960692741777, "loss": 0.0226, "step": 35040 }, { "epoch": 0.38, "learning_rate": 0.00024316339106181486, "loss": 0.0222, "step": 35050 }, { "epoch": 0.38, "learning_rate": 0.00024314717519621196, "loss": 0.0206, "step": 35060 }, { "epoch": 0.38, "learning_rate": 0.00024313095933060902, "loss": 0.0219, "step": 35070 }, { "epoch": 0.38, "learning_rate": 0.00024311474346500614, "loss": 0.0196, "step": 35080 }, { "epoch": 0.38, "learning_rate": 0.00024309852759940324, "loss": 0.0212, "step": 35090 }, { "epoch": 0.38, "learning_rate": 0.00024308231173380033, "loss": 0.0236, "step": 35100 }, { "epoch": 0.38, "learning_rate": 0.00024306609586819742, "loss": 0.0209, "step": 35110 }, { "epoch": 0.38, "learning_rate": 0.0002430498800025945, "loss": 0.0243, "step": 35120 }, { "epoch": 0.38, "learning_rate": 0.0002430336641369916, "loss": 0.0252, "step": 35130 }, { "epoch": 0.38, "learning_rate": 0.00024301744827138873, "loss": 0.022, "step": 35140 }, { "epoch": 0.38, "learning_rate": 0.0002430012324057858, "loss": 0.0204, "step": 35150 }, { "epoch": 0.38, "learning_rate": 0.00024298501654018288, "loss": 0.0244, "step": 35160 }, { "epoch": 0.38, "learning_rate": 0.00024296880067457998, "loss": 0.024, "step": 35170 }, { "epoch": 0.38, "learning_rate": 0.0002429525848089771, "loss": 0.0191, "step": 35180 }, { "epoch": 0.38, "learning_rate": 0.00024293636894337416, "loss": 0.0204, "step": 35190 }, { "epoch": 0.38, "learning_rate": 0.00024292015307777126, "loss": 0.0203, "step": 35200 }, { "epoch": 0.38, "learning_rate": 0.00024290393721216838, "loss": 0.0187, "step": 35210 }, { "epoch": 0.38, "learning_rate": 0.00024288772134656547, "loss": 0.024, "step": 35220 }, { "epoch": 0.38, "learning_rate": 0.00024287150548096253, "loss": 0.0213, "step": 35230 }, { "epoch": 0.38, "learning_rate": 0.00024285528961535963, "loss": 0.0232, "step": 35240 }, { "epoch": 0.38, "learning_rate": 0.00024283907374975675, "loss": 0.0239, "step": 35250 }, { "epoch": 0.38, "learning_rate": 0.00024282285788415384, "loss": 0.0231, "step": 35260 }, { "epoch": 0.38, "learning_rate": 0.00024280664201855096, "loss": 0.0209, "step": 35270 }, { "epoch": 0.38, "learning_rate": 0.00024279042615294802, "loss": 0.0234, "step": 35280 }, { "epoch": 0.38, "learning_rate": 0.00024277421028734512, "loss": 0.0264, "step": 35290 }, { "epoch": 0.38, "learning_rate": 0.0002427579944217422, "loss": 0.0197, "step": 35300 }, { "epoch": 0.38, "learning_rate": 0.00024274177855613933, "loss": 0.0217, "step": 35310 }, { "epoch": 0.38, "learning_rate": 0.0002427255626905364, "loss": 0.025, "step": 35320 }, { "epoch": 0.38, "learning_rate": 0.0002427093468249335, "loss": 0.0206, "step": 35330 }, { "epoch": 0.38, "learning_rate": 0.0002426931309593306, "loss": 0.0194, "step": 35340 }, { "epoch": 0.38, "learning_rate": 0.0002426769150937277, "loss": 0.0208, "step": 35350 }, { "epoch": 0.38, "learning_rate": 0.00024266069922812477, "loss": 0.0186, "step": 35360 }, { "epoch": 0.38, "learning_rate": 0.00024264448336252186, "loss": 0.0249, "step": 35370 }, { "epoch": 0.38, "learning_rate": 0.00024262826749691898, "loss": 0.0194, "step": 35380 }, { "epoch": 0.38, "learning_rate": 0.00024261205163131607, "loss": 0.0238, "step": 35390 }, { "epoch": 0.38, "learning_rate": 0.00024259583576571314, "loss": 0.0237, "step": 35400 }, { "epoch": 0.38, "learning_rate": 0.00024257961990011026, "loss": 0.0235, "step": 35410 }, { "epoch": 0.38, "learning_rate": 0.00024256340403450735, "loss": 0.0218, "step": 35420 }, { "epoch": 0.38, "learning_rate": 0.00024254718816890444, "loss": 0.021, "step": 35430 }, { "epoch": 0.38, "learning_rate": 0.0002425309723033015, "loss": 0.0213, "step": 35440 }, { "epoch": 0.38, "learning_rate": 0.00024251475643769863, "loss": 0.0237, "step": 35450 }, { "epoch": 0.38, "learning_rate": 0.00024249854057209572, "loss": 0.0212, "step": 35460 }, { "epoch": 0.38, "learning_rate": 0.00024248232470649281, "loss": 0.0222, "step": 35470 }, { "epoch": 0.38, "learning_rate": 0.0002424661088408899, "loss": 0.0189, "step": 35480 }, { "epoch": 0.38, "learning_rate": 0.000242449892975287, "loss": 0.02, "step": 35490 }, { "epoch": 0.38, "learning_rate": 0.0002424336771096841, "loss": 0.0212, "step": 35500 }, { "epoch": 0.38, "learning_rate": 0.0002424174612440812, "loss": 0.0202, "step": 35510 }, { "epoch": 0.38, "learning_rate": 0.00024240124537847828, "loss": 0.0224, "step": 35520 }, { "epoch": 0.38, "learning_rate": 0.00024238502951287537, "loss": 0.0291, "step": 35530 }, { "epoch": 0.38, "learning_rate": 0.00024236881364727246, "loss": 0.0229, "step": 35540 }, { "epoch": 0.38, "learning_rate": 0.00024235259778166958, "loss": 0.0221, "step": 35550 }, { "epoch": 0.38, "learning_rate": 0.00024233638191606665, "loss": 0.0222, "step": 35560 }, { "epoch": 0.38, "learning_rate": 0.00024232016605046374, "loss": 0.0247, "step": 35570 }, { "epoch": 0.38, "learning_rate": 0.00024230395018486086, "loss": 0.023, "step": 35580 }, { "epoch": 0.38, "learning_rate": 0.00024228773431925795, "loss": 0.0227, "step": 35590 }, { "epoch": 0.38, "learning_rate": 0.00024227151845365502, "loss": 0.0186, "step": 35600 }, { "epoch": 0.38, "learning_rate": 0.0002422553025880521, "loss": 0.0219, "step": 35610 }, { "epoch": 0.39, "learning_rate": 0.00024223908672244923, "loss": 0.0199, "step": 35620 }, { "epoch": 0.39, "learning_rate": 0.00024222287085684632, "loss": 0.0234, "step": 35630 }, { "epoch": 0.39, "learning_rate": 0.0002422066549912434, "loss": 0.0207, "step": 35640 }, { "epoch": 0.39, "learning_rate": 0.0002421904391256405, "loss": 0.0218, "step": 35650 }, { "epoch": 0.39, "learning_rate": 0.0002421742232600376, "loss": 0.0213, "step": 35660 }, { "epoch": 0.39, "learning_rate": 0.0002421580073944347, "loss": 0.0196, "step": 35670 }, { "epoch": 0.39, "learning_rate": 0.00024214179152883176, "loss": 0.0185, "step": 35680 }, { "epoch": 0.39, "learning_rate": 0.00024212557566322888, "loss": 0.0231, "step": 35690 }, { "epoch": 0.39, "learning_rate": 0.00024210935979762597, "loss": 0.023, "step": 35700 }, { "epoch": 0.39, "learning_rate": 0.0002420931439320231, "loss": 0.0212, "step": 35710 }, { "epoch": 0.39, "learning_rate": 0.00024207692806642016, "loss": 0.0179, "step": 35720 }, { "epoch": 0.39, "learning_rate": 0.00024206071220081725, "loss": 0.0166, "step": 35730 }, { "epoch": 0.39, "learning_rate": 0.00024204449633521434, "loss": 0.0214, "step": 35740 }, { "epoch": 0.39, "learning_rate": 0.00024202828046961146, "loss": 0.0235, "step": 35750 }, { "epoch": 0.39, "learning_rate": 0.00024201206460400853, "loss": 0.0202, "step": 35760 }, { "epoch": 0.39, "learning_rate": 0.00024199584873840562, "loss": 0.0211, "step": 35770 }, { "epoch": 0.39, "learning_rate": 0.00024197963287280274, "loss": 0.0228, "step": 35780 }, { "epoch": 0.39, "learning_rate": 0.00024196341700719984, "loss": 0.0181, "step": 35790 }, { "epoch": 0.39, "learning_rate": 0.0002419472011415969, "loss": 0.0223, "step": 35800 }, { "epoch": 0.39, "learning_rate": 0.000241930985275994, "loss": 0.0206, "step": 35810 }, { "epoch": 0.39, "learning_rate": 0.00024191476941039111, "loss": 0.0188, "step": 35820 }, { "epoch": 0.39, "learning_rate": 0.0002418985535447882, "loss": 0.02, "step": 35830 }, { "epoch": 0.39, "learning_rate": 0.00024188233767918527, "loss": 0.0196, "step": 35840 }, { "epoch": 0.39, "learning_rate": 0.0002418661218135824, "loss": 0.0269, "step": 35850 }, { "epoch": 0.39, "learning_rate": 0.00024184990594797948, "loss": 0.0172, "step": 35860 }, { "epoch": 0.39, "learning_rate": 0.00024183369008237658, "loss": 0.0191, "step": 35870 }, { "epoch": 0.39, "learning_rate": 0.00024181747421677364, "loss": 0.0188, "step": 35880 }, { "epoch": 0.39, "learning_rate": 0.00024180125835117076, "loss": 0.0241, "step": 35890 }, { "epoch": 0.39, "learning_rate": 0.00024178504248556786, "loss": 0.0193, "step": 35900 }, { "epoch": 0.39, "learning_rate": 0.00024176882661996495, "loss": 0.0243, "step": 35910 }, { "epoch": 0.39, "learning_rate": 0.00024175261075436204, "loss": 0.0209, "step": 35920 }, { "epoch": 0.39, "learning_rate": 0.00024173639488875913, "loss": 0.0218, "step": 35930 }, { "epoch": 0.39, "learning_rate": 0.00024172017902315623, "loss": 0.0232, "step": 35940 }, { "epoch": 0.39, "learning_rate": 0.00024170396315755335, "loss": 0.0222, "step": 35950 }, { "epoch": 0.39, "learning_rate": 0.0002416877472919504, "loss": 0.0201, "step": 35960 }, { "epoch": 0.39, "learning_rate": 0.0002416715314263475, "loss": 0.0221, "step": 35970 }, { "epoch": 0.39, "learning_rate": 0.0002416553155607446, "loss": 0.0188, "step": 35980 }, { "epoch": 0.39, "learning_rate": 0.00024163909969514172, "loss": 0.0208, "step": 35990 }, { "epoch": 0.39, "learning_rate": 0.0002416228838295388, "loss": 0.0159, "step": 36000 }, { "epoch": 0.39, "eval_cer": 0.9215590728184603, "eval_loss": 0.01598510891199112, "eval_runtime": 121.8638, "eval_samples_per_second": 16.412, "eval_steps_per_second": 4.103, "step": 36000 }, { "epoch": 0.39, "learning_rate": 0.00024160666796393588, "loss": 0.0191, "step": 36010 }, { "epoch": 0.39, "learning_rate": 0.000241590452098333, "loss": 0.0232, "step": 36020 }, { "epoch": 0.39, "learning_rate": 0.0002415742362327301, "loss": 0.0218, "step": 36030 }, { "epoch": 0.39, "learning_rate": 0.00024155802036712718, "loss": 0.0173, "step": 36040 }, { "epoch": 0.39, "learning_rate": 0.00024154180450152427, "loss": 0.0229, "step": 36050 }, { "epoch": 0.39, "learning_rate": 0.00024152558863592137, "loss": 0.0228, "step": 36060 }, { "epoch": 0.39, "learning_rate": 0.00024150937277031846, "loss": 0.0248, "step": 36070 }, { "epoch": 0.39, "learning_rate": 0.00024149315690471558, "loss": 0.02, "step": 36080 }, { "epoch": 0.39, "learning_rate": 0.00024147694103911265, "loss": 0.0246, "step": 36090 }, { "epoch": 0.39, "learning_rate": 0.00024146072517350974, "loss": 0.024, "step": 36100 }, { "epoch": 0.39, "learning_rate": 0.00024144450930790683, "loss": 0.0192, "step": 36110 }, { "epoch": 0.39, "learning_rate": 0.00024142829344230395, "loss": 0.0251, "step": 36120 }, { "epoch": 0.39, "learning_rate": 0.00024141207757670102, "loss": 0.021, "step": 36130 }, { "epoch": 0.39, "learning_rate": 0.0002413958617110981, "loss": 0.0239, "step": 36140 }, { "epoch": 0.39, "learning_rate": 0.00024137964584549523, "loss": 0.0245, "step": 36150 }, { "epoch": 0.39, "learning_rate": 0.00024136342997989232, "loss": 0.0245, "step": 36160 }, { "epoch": 0.39, "learning_rate": 0.0002413472141142894, "loss": 0.0215, "step": 36170 }, { "epoch": 0.39, "learning_rate": 0.00024133099824868648, "loss": 0.0197, "step": 36180 }, { "epoch": 0.39, "learning_rate": 0.0002413147823830836, "loss": 0.0264, "step": 36190 }, { "epoch": 0.39, "learning_rate": 0.0002412985665174807, "loss": 0.0251, "step": 36200 }, { "epoch": 0.39, "learning_rate": 0.00024128235065187776, "loss": 0.0208, "step": 36210 }, { "epoch": 0.39, "learning_rate": 0.00024126613478627488, "loss": 0.0171, "step": 36220 }, { "epoch": 0.39, "learning_rate": 0.00024124991892067197, "loss": 0.0198, "step": 36230 }, { "epoch": 0.39, "learning_rate": 0.00024123370305506906, "loss": 0.0258, "step": 36240 }, { "epoch": 0.39, "learning_rate": 0.00024121748718946613, "loss": 0.018, "step": 36250 }, { "epoch": 0.39, "learning_rate": 0.00024120127132386325, "loss": 0.0216, "step": 36260 }, { "epoch": 0.39, "learning_rate": 0.00024118505545826034, "loss": 0.0223, "step": 36270 }, { "epoch": 0.39, "learning_rate": 0.00024116883959265746, "loss": 0.0214, "step": 36280 }, { "epoch": 0.39, "learning_rate": 0.00024115262372705453, "loss": 0.0217, "step": 36290 }, { "epoch": 0.39, "learning_rate": 0.00024113640786145162, "loss": 0.0242, "step": 36300 }, { "epoch": 0.39, "learning_rate": 0.0002411201919958487, "loss": 0.0216, "step": 36310 }, { "epoch": 0.39, "learning_rate": 0.00024110397613024583, "loss": 0.0214, "step": 36320 }, { "epoch": 0.39, "learning_rate": 0.0002410877602646429, "loss": 0.0202, "step": 36330 }, { "epoch": 0.39, "learning_rate": 0.00024107154439904, "loss": 0.0285, "step": 36340 }, { "epoch": 0.39, "learning_rate": 0.0002410553285334371, "loss": 0.0202, "step": 36350 }, { "epoch": 0.39, "learning_rate": 0.0002410391126678342, "loss": 0.0197, "step": 36360 }, { "epoch": 0.39, "learning_rate": 0.00024102289680223127, "loss": 0.0243, "step": 36370 }, { "epoch": 0.39, "learning_rate": 0.00024100668093662836, "loss": 0.0204, "step": 36380 }, { "epoch": 0.39, "learning_rate": 0.00024099046507102548, "loss": 0.0195, "step": 36390 }, { "epoch": 0.39, "learning_rate": 0.00024097424920542257, "loss": 0.022, "step": 36400 }, { "epoch": 0.39, "learning_rate": 0.00024095803333981964, "loss": 0.0226, "step": 36410 }, { "epoch": 0.39, "learning_rate": 0.00024094181747421676, "loss": 0.0212, "step": 36420 }, { "epoch": 0.39, "learning_rate": 0.00024092560160861385, "loss": 0.0209, "step": 36430 }, { "epoch": 0.39, "learning_rate": 0.00024090938574301095, "loss": 0.0221, "step": 36440 }, { "epoch": 0.39, "learning_rate": 0.000240893169877408, "loss": 0.0226, "step": 36450 }, { "epoch": 0.39, "learning_rate": 0.00024087695401180513, "loss": 0.0202, "step": 36460 }, { "epoch": 0.39, "learning_rate": 0.00024086073814620222, "loss": 0.0268, "step": 36470 }, { "epoch": 0.39, "learning_rate": 0.00024084452228059932, "loss": 0.029, "step": 36480 }, { "epoch": 0.39, "learning_rate": 0.0002408283064149964, "loss": 0.0236, "step": 36490 }, { "epoch": 0.39, "learning_rate": 0.0002408120905493935, "loss": 0.0221, "step": 36500 }, { "epoch": 0.39, "learning_rate": 0.0002407958746837906, "loss": 0.0218, "step": 36510 }, { "epoch": 0.39, "learning_rate": 0.00024077965881818771, "loss": 0.0187, "step": 36520 }, { "epoch": 0.39, "learning_rate": 0.00024076344295258478, "loss": 0.0206, "step": 36530 }, { "epoch": 0.4, "learning_rate": 0.00024074722708698187, "loss": 0.0207, "step": 36540 }, { "epoch": 0.4, "learning_rate": 0.00024073101122137897, "loss": 0.0194, "step": 36550 }, { "epoch": 0.4, "learning_rate": 0.00024071479535577609, "loss": 0.0236, "step": 36560 }, { "epoch": 0.4, "learning_rate": 0.00024069857949017315, "loss": 0.0229, "step": 36570 }, { "epoch": 0.4, "learning_rate": 0.00024068236362457024, "loss": 0.0187, "step": 36580 }, { "epoch": 0.4, "learning_rate": 0.00024066614775896736, "loss": 0.0235, "step": 36590 }, { "epoch": 0.4, "learning_rate": 0.00024064993189336446, "loss": 0.0198, "step": 36600 }, { "epoch": 0.4, "learning_rate": 0.00024063371602776152, "loss": 0.0204, "step": 36610 }, { "epoch": 0.4, "learning_rate": 0.00024061750016215861, "loss": 0.0214, "step": 36620 }, { "epoch": 0.4, "learning_rate": 0.00024060128429655573, "loss": 0.0207, "step": 36630 }, { "epoch": 0.4, "learning_rate": 0.00024058506843095283, "loss": 0.0266, "step": 36640 }, { "epoch": 0.4, "learning_rate": 0.0002405688525653499, "loss": 0.0224, "step": 36650 }, { "epoch": 0.4, "learning_rate": 0.000240552636699747, "loss": 0.022, "step": 36660 }, { "epoch": 0.4, "learning_rate": 0.0002405364208341441, "loss": 0.0262, "step": 36670 }, { "epoch": 0.4, "learning_rate": 0.0002405202049685412, "loss": 0.0233, "step": 36680 }, { "epoch": 0.4, "learning_rate": 0.00024050398910293832, "loss": 0.019, "step": 36690 }, { "epoch": 0.4, "learning_rate": 0.00024048777323733538, "loss": 0.0192, "step": 36700 }, { "epoch": 0.4, "learning_rate": 0.00024047155737173248, "loss": 0.0214, "step": 36710 }, { "epoch": 0.4, "learning_rate": 0.0002404553415061296, "loss": 0.0196, "step": 36720 }, { "epoch": 0.4, "learning_rate": 0.0002404391256405267, "loss": 0.0199, "step": 36730 }, { "epoch": 0.4, "learning_rate": 0.00024042290977492375, "loss": 0.02, "step": 36740 }, { "epoch": 0.4, "learning_rate": 0.00024040669390932085, "loss": 0.0213, "step": 36750 }, { "epoch": 0.4, "learning_rate": 0.00024039047804371797, "loss": 0.021, "step": 36760 }, { "epoch": 0.4, "learning_rate": 0.00024037426217811506, "loss": 0.0224, "step": 36770 }, { "epoch": 0.4, "learning_rate": 0.00024035804631251213, "loss": 0.0178, "step": 36780 }, { "epoch": 0.4, "learning_rate": 0.00024034183044690925, "loss": 0.023, "step": 36790 }, { "epoch": 0.4, "learning_rate": 0.00024032561458130634, "loss": 0.0263, "step": 36800 }, { "epoch": 0.4, "learning_rate": 0.00024030939871570343, "loss": 0.0256, "step": 36810 }, { "epoch": 0.4, "learning_rate": 0.0002402931828501005, "loss": 0.0207, "step": 36820 }, { "epoch": 0.4, "learning_rate": 0.00024027696698449762, "loss": 0.0205, "step": 36830 }, { "epoch": 0.4, "learning_rate": 0.0002402607511188947, "loss": 0.02, "step": 36840 }, { "epoch": 0.4, "learning_rate": 0.0002402445352532918, "loss": 0.0192, "step": 36850 }, { "epoch": 0.4, "learning_rate": 0.0002402283193876889, "loss": 0.0187, "step": 36860 }, { "epoch": 0.4, "learning_rate": 0.000240212103522086, "loss": 0.0175, "step": 36870 }, { "epoch": 0.4, "learning_rate": 0.00024019588765648308, "loss": 0.0221, "step": 36880 }, { "epoch": 0.4, "learning_rate": 0.0002401796717908802, "loss": 0.0205, "step": 36890 }, { "epoch": 0.4, "learning_rate": 0.00024016345592527727, "loss": 0.0209, "step": 36900 }, { "epoch": 0.4, "learning_rate": 0.00024014724005967436, "loss": 0.0173, "step": 36910 }, { "epoch": 0.4, "learning_rate": 0.00024013102419407145, "loss": 0.0183, "step": 36920 }, { "epoch": 0.4, "learning_rate": 0.00024011480832846857, "loss": 0.021, "step": 36930 }, { "epoch": 0.4, "learning_rate": 0.00024009859246286564, "loss": 0.0208, "step": 36940 }, { "epoch": 0.4, "learning_rate": 0.00024008237659726273, "loss": 0.0239, "step": 36950 }, { "epoch": 0.4, "learning_rate": 0.00024006616073165985, "loss": 0.0271, "step": 36960 }, { "epoch": 0.4, "learning_rate": 0.00024004994486605694, "loss": 0.0209, "step": 36970 }, { "epoch": 0.4, "learning_rate": 0.000240033729000454, "loss": 0.0246, "step": 36980 }, { "epoch": 0.4, "learning_rate": 0.0002400175131348511, "loss": 0.0247, "step": 36990 }, { "epoch": 0.4, "learning_rate": 0.00024000129726924822, "loss": 0.0205, "step": 37000 }, { "epoch": 0.4, "eval_cer": 0.9216033715692354, "eval_loss": 0.01503350492566824, "eval_runtime": 121.5384, "eval_samples_per_second": 16.456, "eval_steps_per_second": 4.114, "step": 37000 }, { "epoch": 0.4, "learning_rate": 0.0002399850814036453, "loss": 0.0237, "step": 37010 }, { "epoch": 0.4, "learning_rate": 0.00023996886553804238, "loss": 0.019, "step": 37020 }, { "epoch": 0.4, "learning_rate": 0.0002399526496724395, "loss": 0.0214, "step": 37030 }, { "epoch": 0.4, "learning_rate": 0.0002399364338068366, "loss": 0.0213, "step": 37040 }, { "epoch": 0.4, "learning_rate": 0.00023992021794123368, "loss": 0.0224, "step": 37050 }, { "epoch": 0.4, "learning_rate": 0.00023990400207563078, "loss": 0.0223, "step": 37060 }, { "epoch": 0.4, "learning_rate": 0.00023988778621002787, "loss": 0.0258, "step": 37070 }, { "epoch": 0.4, "learning_rate": 0.00023987157034442496, "loss": 0.0233, "step": 37080 }, { "epoch": 0.4, "learning_rate": 0.00023985535447882208, "loss": 0.02, "step": 37090 }, { "epoch": 0.4, "learning_rate": 0.00023983913861321915, "loss": 0.0224, "step": 37100 }, { "epoch": 0.4, "learning_rate": 0.00023982292274761624, "loss": 0.0215, "step": 37110 }, { "epoch": 0.4, "learning_rate": 0.00023980670688201333, "loss": 0.0213, "step": 37120 }, { "epoch": 0.4, "learning_rate": 0.00023979049101641045, "loss": 0.0185, "step": 37130 }, { "epoch": 0.4, "learning_rate": 0.00023977427515080752, "loss": 0.0222, "step": 37140 }, { "epoch": 0.4, "learning_rate": 0.0002397580592852046, "loss": 0.0247, "step": 37150 }, { "epoch": 0.4, "learning_rate": 0.00023974184341960173, "loss": 0.0273, "step": 37160 }, { "epoch": 0.4, "learning_rate": 0.00023972562755399882, "loss": 0.0215, "step": 37170 }, { "epoch": 0.4, "learning_rate": 0.0002397094116883959, "loss": 0.0223, "step": 37180 }, { "epoch": 0.4, "learning_rate": 0.00023969319582279298, "loss": 0.0267, "step": 37190 }, { "epoch": 0.4, "learning_rate": 0.0002396769799571901, "loss": 0.0248, "step": 37200 }, { "epoch": 0.4, "learning_rate": 0.0002396607640915872, "loss": 0.0237, "step": 37210 }, { "epoch": 0.4, "learning_rate": 0.00023964454822598426, "loss": 0.0235, "step": 37220 }, { "epoch": 0.4, "learning_rate": 0.00023962833236038138, "loss": 0.0251, "step": 37230 }, { "epoch": 0.4, "learning_rate": 0.00023961211649477847, "loss": 0.0213, "step": 37240 }, { "epoch": 0.4, "learning_rate": 0.00023959590062917557, "loss": 0.0223, "step": 37250 }, { "epoch": 0.4, "learning_rate": 0.00023957968476357263, "loss": 0.0217, "step": 37260 }, { "epoch": 0.4, "learning_rate": 0.00023956346889796975, "loss": 0.025, "step": 37270 }, { "epoch": 0.4, "learning_rate": 0.00023954725303236684, "loss": 0.1174, "step": 37280 }, { "epoch": 0.4, "learning_rate": 0.00023953103716676396, "loss": 0.0407, "step": 37290 }, { "epoch": 0.4, "learning_rate": 0.00023951482130116103, "loss": 0.0245, "step": 37300 }, { "epoch": 0.4, "learning_rate": 0.00023949860543555812, "loss": 0.0299, "step": 37310 }, { "epoch": 0.4, "learning_rate": 0.00023948238956995522, "loss": 0.0321, "step": 37320 }, { "epoch": 0.4, "learning_rate": 0.00023946617370435233, "loss": 0.0268, "step": 37330 }, { "epoch": 0.4, "learning_rate": 0.0002394499578387494, "loss": 0.0201, "step": 37340 }, { "epoch": 0.4, "learning_rate": 0.0002394337419731465, "loss": 0.0222, "step": 37350 }, { "epoch": 0.4, "learning_rate": 0.0002394175261075436, "loss": 0.0215, "step": 37360 }, { "epoch": 0.4, "learning_rate": 0.0002394013102419407, "loss": 0.0193, "step": 37370 }, { "epoch": 0.4, "learning_rate": 0.00023938509437633777, "loss": 0.0235, "step": 37380 }, { "epoch": 0.4, "learning_rate": 0.00023936887851073486, "loss": 0.0192, "step": 37390 }, { "epoch": 0.4, "learning_rate": 0.00023935266264513198, "loss": 0.0294, "step": 37400 }, { "epoch": 0.4, "learning_rate": 0.00023933644677952908, "loss": 0.0462, "step": 37410 }, { "epoch": 0.4, "learning_rate": 0.00023932023091392617, "loss": 0.0237, "step": 37420 }, { "epoch": 0.4, "learning_rate": 0.00023930401504832326, "loss": 0.0236, "step": 37430 }, { "epoch": 0.4, "learning_rate": 0.00023928779918272036, "loss": 0.0269, "step": 37440 }, { "epoch": 0.4, "learning_rate": 0.00023927158331711745, "loss": 0.0191, "step": 37450 }, { "epoch": 0.4, "learning_rate": 0.00023925536745151457, "loss": 0.022, "step": 37460 }, { "epoch": 0.41, "learning_rate": 0.00023923915158591163, "loss": 0.0244, "step": 37470 }, { "epoch": 0.41, "learning_rate": 0.00023922293572030873, "loss": 0.0211, "step": 37480 }, { "epoch": 0.41, "learning_rate": 0.00023920671985470582, "loss": 0.0215, "step": 37490 }, { "epoch": 0.41, "learning_rate": 0.00023919050398910294, "loss": 0.0221, "step": 37500 }, { "epoch": 0.41, "learning_rate": 0.0002391742881235, "loss": 0.0211, "step": 37510 }, { "epoch": 0.41, "learning_rate": 0.0002391580722578971, "loss": 0.0239, "step": 37520 }, { "epoch": 0.41, "learning_rate": 0.00023914185639229422, "loss": 0.0172, "step": 37530 }, { "epoch": 0.41, "learning_rate": 0.0002391256405266913, "loss": 0.0204, "step": 37540 }, { "epoch": 0.41, "learning_rate": 0.00023910942466108838, "loss": 0.0186, "step": 37550 }, { "epoch": 0.41, "learning_rate": 0.00023909320879548547, "loss": 0.0206, "step": 37560 }, { "epoch": 0.41, "learning_rate": 0.0002390769929298826, "loss": 0.0233, "step": 37570 }, { "epoch": 0.41, "learning_rate": 0.00023906077706427968, "loss": 0.0221, "step": 37580 }, { "epoch": 0.41, "learning_rate": 0.00023904456119867675, "loss": 0.0168, "step": 37590 }, { "epoch": 0.41, "learning_rate": 0.00023902834533307387, "loss": 0.0237, "step": 37600 }, { "epoch": 0.41, "learning_rate": 0.00023901212946747096, "loss": 0.0144, "step": 37610 }, { "epoch": 0.41, "learning_rate": 0.00023899591360186805, "loss": 0.022, "step": 37620 }, { "epoch": 0.41, "learning_rate": 0.00023897969773626512, "loss": 0.0202, "step": 37630 }, { "epoch": 0.41, "learning_rate": 0.00023896348187066224, "loss": 0.0218, "step": 37640 }, { "epoch": 0.41, "learning_rate": 0.00023894726600505933, "loss": 0.0204, "step": 37650 }, { "epoch": 0.41, "learning_rate": 0.00023893105013945645, "loss": 0.0209, "step": 37660 }, { "epoch": 0.41, "learning_rate": 0.00023891483427385352, "loss": 0.0199, "step": 37670 }, { "epoch": 0.41, "learning_rate": 0.0002388986184082506, "loss": 0.0183, "step": 37680 }, { "epoch": 0.41, "learning_rate": 0.0002388824025426477, "loss": 0.0211, "step": 37690 }, { "epoch": 0.41, "learning_rate": 0.00023886618667704482, "loss": 0.0228, "step": 37700 }, { "epoch": 0.41, "learning_rate": 0.00023884997081144189, "loss": 0.0188, "step": 37710 }, { "epoch": 0.41, "learning_rate": 0.00023883375494583898, "loss": 0.0198, "step": 37720 }, { "epoch": 0.41, "learning_rate": 0.0002388175390802361, "loss": 0.0211, "step": 37730 }, { "epoch": 0.41, "learning_rate": 0.0002388013232146332, "loss": 0.0256, "step": 37740 }, { "epoch": 0.41, "learning_rate": 0.00023878510734903026, "loss": 0.0202, "step": 37750 }, { "epoch": 0.41, "learning_rate": 0.00023876889148342735, "loss": 0.0174, "step": 37760 }, { "epoch": 0.41, "learning_rate": 0.00023875267561782447, "loss": 0.0242, "step": 37770 }, { "epoch": 0.41, "learning_rate": 0.00023873645975222156, "loss": 0.0234, "step": 37780 }, { "epoch": 0.41, "learning_rate": 0.00023872024388661863, "loss": 0.0192, "step": 37790 }, { "epoch": 0.41, "learning_rate": 0.00023870402802101575, "loss": 0.0211, "step": 37800 }, { "epoch": 0.41, "learning_rate": 0.00023868781215541284, "loss": 0.0225, "step": 37810 }, { "epoch": 0.41, "learning_rate": 0.00023867159628980993, "loss": 0.0218, "step": 37820 }, { "epoch": 0.41, "learning_rate": 0.000238655380424207, "loss": 0.0211, "step": 37830 }, { "epoch": 0.41, "learning_rate": 0.00023863916455860412, "loss": 0.0178, "step": 37840 }, { "epoch": 0.41, "learning_rate": 0.0002386229486930012, "loss": 0.0214, "step": 37850 }, { "epoch": 0.41, "learning_rate": 0.0002386067328273983, "loss": 0.0209, "step": 37860 }, { "epoch": 0.41, "learning_rate": 0.0002385905169617954, "loss": 0.0224, "step": 37870 }, { "epoch": 0.41, "learning_rate": 0.0002385743010961925, "loss": 0.0331, "step": 37880 }, { "epoch": 0.41, "learning_rate": 0.00023855808523058958, "loss": 0.0294, "step": 37890 }, { "epoch": 0.41, "learning_rate": 0.0002385418693649867, "loss": 0.0195, "step": 37900 }, { "epoch": 0.41, "learning_rate": 0.00023852565349938377, "loss": 0.0237, "step": 37910 }, { "epoch": 0.41, "learning_rate": 0.00023850943763378086, "loss": 0.0203, "step": 37920 }, { "epoch": 0.41, "learning_rate": 0.00023849322176817795, "loss": 0.0192, "step": 37930 }, { "epoch": 0.41, "learning_rate": 0.00023847700590257507, "loss": 0.0179, "step": 37940 }, { "epoch": 0.41, "learning_rate": 0.00023846079003697214, "loss": 0.019, "step": 37950 }, { "epoch": 0.41, "learning_rate": 0.00023844457417136923, "loss": 0.0196, "step": 37960 }, { "epoch": 0.41, "learning_rate": 0.00023842835830576635, "loss": 0.0184, "step": 37970 }, { "epoch": 0.41, "learning_rate": 0.00023841214244016344, "loss": 0.0213, "step": 37980 }, { "epoch": 0.41, "learning_rate": 0.0002383959265745605, "loss": 0.0268, "step": 37990 }, { "epoch": 0.41, "learning_rate": 0.0002383797107089576, "loss": 0.0197, "step": 38000 }, { "epoch": 0.41, "eval_cer": 0.9215773134805442, "eval_loss": 0.015152968466281891, "eval_runtime": 121.8268, "eval_samples_per_second": 16.417, "eval_steps_per_second": 4.104, "step": 38000 }, { "epoch": 0.41, "learning_rate": 0.00023836349484335472, "loss": 0.0217, "step": 38010 }, { "epoch": 0.41, "learning_rate": 0.00023834727897775182, "loss": 0.0196, "step": 38020 }, { "epoch": 0.41, "learning_rate": 0.00023833106311214888, "loss": 0.0226, "step": 38030 }, { "epoch": 0.41, "learning_rate": 0.000238314847246546, "loss": 0.0194, "step": 38040 }, { "epoch": 0.41, "learning_rate": 0.0002382986313809431, "loss": 0.0182, "step": 38050 }, { "epoch": 0.41, "learning_rate": 0.0002382824155153402, "loss": 0.0312, "step": 38060 }, { "epoch": 0.41, "learning_rate": 0.00023826619964973728, "loss": 0.0229, "step": 38070 }, { "epoch": 0.41, "learning_rate": 0.00023824998378413437, "loss": 0.0219, "step": 38080 }, { "epoch": 0.41, "learning_rate": 0.00023823376791853146, "loss": 0.0211, "step": 38090 }, { "epoch": 0.41, "learning_rate": 0.00023821755205292858, "loss": 0.0189, "step": 38100 }, { "epoch": 0.41, "learning_rate": 0.00023820133618732565, "loss": 0.021, "step": 38110 }, { "epoch": 0.41, "learning_rate": 0.00023818512032172274, "loss": 0.0173, "step": 38120 }, { "epoch": 0.41, "learning_rate": 0.00023816890445611984, "loss": 0.0245, "step": 38130 }, { "epoch": 0.41, "learning_rate": 0.00023815268859051696, "loss": 0.0225, "step": 38140 }, { "epoch": 0.41, "learning_rate": 0.00023813647272491405, "loss": 0.0223, "step": 38150 }, { "epoch": 0.41, "learning_rate": 0.00023812025685931111, "loss": 0.0241, "step": 38160 }, { "epoch": 0.41, "learning_rate": 0.00023810404099370823, "loss": 0.0209, "step": 38170 }, { "epoch": 0.41, "learning_rate": 0.00023808782512810533, "loss": 0.0235, "step": 38180 }, { "epoch": 0.41, "learning_rate": 0.00023807160926250242, "loss": 0.023, "step": 38190 }, { "epoch": 0.41, "learning_rate": 0.00023805539339689948, "loss": 0.021, "step": 38200 }, { "epoch": 0.41, "learning_rate": 0.0002380391775312966, "loss": 0.0235, "step": 38210 }, { "epoch": 0.41, "learning_rate": 0.0002380229616656937, "loss": 0.0196, "step": 38220 }, { "epoch": 0.41, "learning_rate": 0.0002380067458000908, "loss": 0.0236, "step": 38230 }, { "epoch": 0.41, "learning_rate": 0.00023799052993448788, "loss": 0.0208, "step": 38240 }, { "epoch": 0.41, "learning_rate": 0.00023797431406888498, "loss": 0.0211, "step": 38250 }, { "epoch": 0.41, "learning_rate": 0.00023795809820328207, "loss": 0.021, "step": 38260 }, { "epoch": 0.41, "learning_rate": 0.0002379418823376792, "loss": 0.018, "step": 38270 }, { "epoch": 0.41, "learning_rate": 0.00023792566647207625, "loss": 0.0188, "step": 38280 }, { "epoch": 0.41, "learning_rate": 0.00023790945060647335, "loss": 0.0192, "step": 38290 }, { "epoch": 0.41, "learning_rate": 0.00023789323474087047, "loss": 0.0199, "step": 38300 }, { "epoch": 0.41, "learning_rate": 0.00023787701887526756, "loss": 0.0231, "step": 38310 }, { "epoch": 0.41, "learning_rate": 0.00023786080300966462, "loss": 0.0208, "step": 38320 }, { "epoch": 0.41, "learning_rate": 0.00023784458714406172, "loss": 0.0179, "step": 38330 }, { "epoch": 0.41, "learning_rate": 0.00023782837127845884, "loss": 0.0203, "step": 38340 }, { "epoch": 0.41, "learning_rate": 0.00023781215541285593, "loss": 0.0209, "step": 38350 }, { "epoch": 0.41, "learning_rate": 0.000237795939547253, "loss": 0.022, "step": 38360 }, { "epoch": 0.41, "learning_rate": 0.00023777972368165012, "loss": 0.0221, "step": 38370 }, { "epoch": 0.41, "learning_rate": 0.0002377635078160472, "loss": 0.0196, "step": 38380 }, { "epoch": 0.42, "learning_rate": 0.0002377472919504443, "loss": 0.0163, "step": 38390 }, { "epoch": 0.42, "learning_rate": 0.00023773107608484137, "loss": 0.0232, "step": 38400 }, { "epoch": 0.42, "learning_rate": 0.0002377148602192385, "loss": 0.021, "step": 38410 }, { "epoch": 0.42, "learning_rate": 0.00023769864435363558, "loss": 0.0195, "step": 38420 }, { "epoch": 0.42, "learning_rate": 0.00023768242848803267, "loss": 0.0216, "step": 38430 }, { "epoch": 0.42, "learning_rate": 0.00023766621262242977, "loss": 0.0225, "step": 38440 }, { "epoch": 0.42, "learning_rate": 0.00023764999675682686, "loss": 0.0279, "step": 38450 }, { "epoch": 0.42, "learning_rate": 0.00023763378089122395, "loss": 0.025, "step": 38460 }, { "epoch": 0.42, "learning_rate": 0.00023761756502562107, "loss": 0.0254, "step": 38470 }, { "epoch": 0.42, "learning_rate": 0.00023760134916001814, "loss": 0.0207, "step": 38480 }, { "epoch": 0.42, "learning_rate": 0.00023758513329441523, "loss": 0.0201, "step": 38490 }, { "epoch": 0.42, "learning_rate": 0.00023756891742881232, "loss": 0.0191, "step": 38500 }, { "epoch": 0.42, "learning_rate": 0.00023755270156320944, "loss": 0.0225, "step": 38510 }, { "epoch": 0.42, "learning_rate": 0.0002375364856976065, "loss": 0.019, "step": 38520 }, { "epoch": 0.42, "learning_rate": 0.0002375202698320036, "loss": 0.0216, "step": 38530 }, { "epoch": 0.42, "learning_rate": 0.00023750405396640072, "loss": 0.0208, "step": 38540 }, { "epoch": 0.42, "learning_rate": 0.0002374878381007978, "loss": 0.0179, "step": 38550 }, { "epoch": 0.42, "learning_rate": 0.00023747162223519488, "loss": 0.0179, "step": 38560 }, { "epoch": 0.42, "learning_rate": 0.00023745540636959197, "loss": 0.0233, "step": 38570 }, { "epoch": 0.42, "learning_rate": 0.0002374391905039891, "loss": 0.0192, "step": 38580 }, { "epoch": 0.42, "learning_rate": 0.00023742297463838618, "loss": 0.019, "step": 38590 }, { "epoch": 0.42, "learning_rate": 0.00023740675877278325, "loss": 0.0243, "step": 38600 }, { "epoch": 0.42, "learning_rate": 0.00023739054290718037, "loss": 0.0169, "step": 38610 }, { "epoch": 0.42, "learning_rate": 0.00023737432704157746, "loss": 0.0207, "step": 38620 }, { "epoch": 0.42, "learning_rate": 0.00023735811117597455, "loss": 0.0208, "step": 38630 }, { "epoch": 0.42, "learning_rate": 0.00023734189531037162, "loss": 0.0176, "step": 38640 }, { "epoch": 0.42, "learning_rate": 0.00023732567944476874, "loss": 0.0203, "step": 38650 }, { "epoch": 0.42, "learning_rate": 0.00023730946357916583, "loss": 0.0159, "step": 38660 }, { "epoch": 0.42, "learning_rate": 0.00023729324771356295, "loss": 0.0198, "step": 38670 }, { "epoch": 0.42, "learning_rate": 0.00023727703184796002, "loss": 0.0217, "step": 38680 }, { "epoch": 0.42, "learning_rate": 0.0002372608159823571, "loss": 0.0208, "step": 38690 }, { "epoch": 0.42, "learning_rate": 0.0002372446001167542, "loss": 0.0206, "step": 38700 }, { "epoch": 0.42, "learning_rate": 0.00023722838425115132, "loss": 0.0202, "step": 38710 }, { "epoch": 0.42, "learning_rate": 0.0002372121683855484, "loss": 0.0187, "step": 38720 }, { "epoch": 0.42, "learning_rate": 0.00023719595251994548, "loss": 0.0183, "step": 38730 }, { "epoch": 0.42, "learning_rate": 0.0002371797366543426, "loss": 0.0178, "step": 38740 }, { "epoch": 0.42, "learning_rate": 0.0002371635207887397, "loss": 0.0192, "step": 38750 }, { "epoch": 0.42, "learning_rate": 0.00023714730492313676, "loss": 0.0179, "step": 38760 }, { "epoch": 0.42, "learning_rate": 0.00023713108905753385, "loss": 0.0188, "step": 38770 }, { "epoch": 0.42, "learning_rate": 0.00023711487319193097, "loss": 0.0198, "step": 38780 }, { "epoch": 0.42, "learning_rate": 0.00023709865732632807, "loss": 0.0193, "step": 38790 }, { "epoch": 0.42, "learning_rate": 0.00023708244146072513, "loss": 0.0226, "step": 38800 }, { "epoch": 0.42, "learning_rate": 0.00023706622559512225, "loss": 0.0213, "step": 38810 }, { "epoch": 0.42, "learning_rate": 0.00023705000972951934, "loss": 0.0194, "step": 38820 }, { "epoch": 0.42, "learning_rate": 0.00023703379386391644, "loss": 0.0186, "step": 38830 }, { "epoch": 0.42, "learning_rate": 0.0002370175779983135, "loss": 0.0243, "step": 38840 }, { "epoch": 0.42, "learning_rate": 0.00023700136213271062, "loss": 0.0216, "step": 38850 }, { "epoch": 0.42, "learning_rate": 0.00023698514626710771, "loss": 0.0252, "step": 38860 }, { "epoch": 0.42, "learning_rate": 0.0002369689304015048, "loss": 0.0192, "step": 38870 }, { "epoch": 0.42, "learning_rate": 0.00023695271453590193, "loss": 0.0432, "step": 38880 }, { "epoch": 0.42, "learning_rate": 0.000236936498670299, "loss": 0.023, "step": 38890 }, { "epoch": 0.42, "learning_rate": 0.00023692028280469609, "loss": 0.0287, "step": 38900 }, { "epoch": 0.42, "learning_rate": 0.0002369040669390932, "loss": 0.0181, "step": 38910 }, { "epoch": 0.42, "learning_rate": 0.0002368878510734903, "loss": 0.0276, "step": 38920 }, { "epoch": 0.42, "learning_rate": 0.00023687163520788736, "loss": 0.0228, "step": 38930 }, { "epoch": 0.42, "learning_rate": 0.00023685541934228446, "loss": 0.0212, "step": 38940 }, { "epoch": 0.42, "learning_rate": 0.00023683920347668158, "loss": 0.0209, "step": 38950 }, { "epoch": 0.42, "learning_rate": 0.00023682298761107867, "loss": 0.0226, "step": 38960 }, { "epoch": 0.42, "learning_rate": 0.00023680677174547573, "loss": 0.0214, "step": 38970 }, { "epoch": 0.42, "learning_rate": 0.00023679055587987285, "loss": 0.022, "step": 38980 }, { "epoch": 0.42, "learning_rate": 0.00023677434001426995, "loss": 0.0209, "step": 38990 }, { "epoch": 0.42, "learning_rate": 0.00023675812414866704, "loss": 0.0205, "step": 39000 }, { "epoch": 0.42, "eval_cer": 0.9215512553918529, "eval_loss": 0.015001688152551651, "eval_runtime": 121.88, "eval_samples_per_second": 16.41, "eval_steps_per_second": 4.102, "step": 39000 }, { "epoch": 0.42, "learning_rate": 0.0002367419082830641, "loss": 0.023, "step": 39010 }, { "epoch": 0.42, "learning_rate": 0.00023672569241746123, "loss": 0.0193, "step": 39020 }, { "epoch": 0.42, "learning_rate": 0.00023670947655185832, "loss": 0.0212, "step": 39030 }, { "epoch": 0.42, "learning_rate": 0.00023669326068625544, "loss": 0.0204, "step": 39040 }, { "epoch": 0.42, "learning_rate": 0.0002366770448206525, "loss": 0.0246, "step": 39050 }, { "epoch": 0.42, "learning_rate": 0.0002366608289550496, "loss": 0.0227, "step": 39060 }, { "epoch": 0.42, "learning_rate": 0.0002366446130894467, "loss": 0.0311, "step": 39070 }, { "epoch": 0.42, "learning_rate": 0.0002366283972238438, "loss": 0.0237, "step": 39080 }, { "epoch": 0.42, "learning_rate": 0.00023661218135824087, "loss": 0.0214, "step": 39090 }, { "epoch": 0.42, "learning_rate": 0.00023659596549263797, "loss": 0.0207, "step": 39100 }, { "epoch": 0.42, "learning_rate": 0.0002365797496270351, "loss": 0.0198, "step": 39110 }, { "epoch": 0.42, "learning_rate": 0.00023656353376143218, "loss": 0.0235, "step": 39120 }, { "epoch": 0.42, "learning_rate": 0.00023654731789582925, "loss": 0.0217, "step": 39130 }, { "epoch": 0.42, "learning_rate": 0.00023653110203022634, "loss": 0.0222, "step": 39140 }, { "epoch": 0.42, "learning_rate": 0.00023651488616462346, "loss": 0.0196, "step": 39150 }, { "epoch": 0.42, "learning_rate": 0.00023649867029902055, "loss": 0.019, "step": 39160 }, { "epoch": 0.42, "learning_rate": 0.00023648245443341762, "loss": 0.0188, "step": 39170 }, { "epoch": 0.42, "learning_rate": 0.00023646623856781474, "loss": 0.0175, "step": 39180 }, { "epoch": 0.42, "learning_rate": 0.00023645002270221183, "loss": 0.0186, "step": 39190 }, { "epoch": 0.42, "learning_rate": 0.00023643380683660892, "loss": 0.0216, "step": 39200 }, { "epoch": 0.42, "learning_rate": 0.000236417590971006, "loss": 0.0211, "step": 39210 }, { "epoch": 0.42, "learning_rate": 0.0002364013751054031, "loss": 0.0211, "step": 39220 }, { "epoch": 0.42, "learning_rate": 0.0002363851592398002, "loss": 0.0213, "step": 39230 }, { "epoch": 0.42, "learning_rate": 0.0002363689433741973, "loss": 0.0174, "step": 39240 }, { "epoch": 0.42, "learning_rate": 0.00023635272750859439, "loss": 0.0237, "step": 39250 }, { "epoch": 0.42, "learning_rate": 0.00023633651164299148, "loss": 0.0222, "step": 39260 }, { "epoch": 0.42, "learning_rate": 0.00023632029577738857, "loss": 0.0244, "step": 39270 }, { "epoch": 0.42, "learning_rate": 0.0002363040799117857, "loss": 0.0227, "step": 39280 }, { "epoch": 0.42, "learning_rate": 0.00023628786404618276, "loss": 0.021, "step": 39290 }, { "epoch": 0.42, "learning_rate": 0.00023627164818057985, "loss": 0.0199, "step": 39300 }, { "epoch": 0.42, "learning_rate": 0.00023625543231497697, "loss": 0.0252, "step": 39310 }, { "epoch": 0.43, "learning_rate": 0.00023623921644937406, "loss": 0.0207, "step": 39320 }, { "epoch": 0.43, "learning_rate": 0.00023622300058377113, "loss": 0.0176, "step": 39330 }, { "epoch": 0.43, "learning_rate": 0.00023620678471816822, "loss": 0.0172, "step": 39340 }, { "epoch": 0.43, "learning_rate": 0.00023619056885256534, "loss": 0.0185, "step": 39350 }, { "epoch": 0.43, "learning_rate": 0.00023617435298696243, "loss": 0.0217, "step": 39360 }, { "epoch": 0.43, "learning_rate": 0.0002361581371213595, "loss": 0.0213, "step": 39370 }, { "epoch": 0.43, "learning_rate": 0.00023614192125575662, "loss": 0.0216, "step": 39380 }, { "epoch": 0.43, "learning_rate": 0.0002361257053901537, "loss": 0.0249, "step": 39390 }, { "epoch": 0.43, "learning_rate": 0.0002361094895245508, "loss": 0.018, "step": 39400 }, { "epoch": 0.43, "learning_rate": 0.00023609327365894787, "loss": 0.0177, "step": 39410 }, { "epoch": 0.43, "learning_rate": 0.000236077057793345, "loss": 0.0187, "step": 39420 }, { "epoch": 0.43, "learning_rate": 0.00023606084192774208, "loss": 0.0182, "step": 39430 }, { "epoch": 0.43, "learning_rate": 0.00023604462606213917, "loss": 0.0185, "step": 39440 }, { "epoch": 0.43, "learning_rate": 0.00023602841019653627, "loss": 0.0198, "step": 39450 }, { "epoch": 0.43, "learning_rate": 0.00023601219433093336, "loss": 0.0226, "step": 39460 }, { "epoch": 0.43, "learning_rate": 0.00023599597846533045, "loss": 0.0199, "step": 39470 }, { "epoch": 0.43, "learning_rate": 0.00023597976259972757, "loss": 0.0217, "step": 39480 }, { "epoch": 0.43, "learning_rate": 0.00023596354673412464, "loss": 0.0228, "step": 39490 }, { "epoch": 0.43, "learning_rate": 0.00023594733086852173, "loss": 0.0198, "step": 39500 }, { "epoch": 0.43, "learning_rate": 0.00023593111500291882, "loss": 0.0179, "step": 39510 }, { "epoch": 0.43, "learning_rate": 0.00023591489913731594, "loss": 0.0168, "step": 39520 }, { "epoch": 0.43, "learning_rate": 0.000235898683271713, "loss": 0.0223, "step": 39530 }, { "epoch": 0.43, "learning_rate": 0.0002358824674061101, "loss": 0.0182, "step": 39540 }, { "epoch": 0.43, "learning_rate": 0.00023586625154050722, "loss": 0.0222, "step": 39550 }, { "epoch": 0.43, "learning_rate": 0.00023585003567490431, "loss": 0.023, "step": 39560 }, { "epoch": 0.43, "learning_rate": 0.0002358338198093014, "loss": 0.0185, "step": 39570 }, { "epoch": 0.43, "learning_rate": 0.00023581760394369847, "loss": 0.0194, "step": 39580 }, { "epoch": 0.43, "learning_rate": 0.0002358013880780956, "loss": 0.0204, "step": 39590 }, { "epoch": 0.43, "learning_rate": 0.00023578517221249269, "loss": 0.02, "step": 39600 }, { "epoch": 0.43, "learning_rate": 0.0002357689563468898, "loss": 0.0204, "step": 39610 }, { "epoch": 0.43, "learning_rate": 0.00023575274048128687, "loss": 0.0213, "step": 39620 }, { "epoch": 0.43, "learning_rate": 0.00023573652461568396, "loss": 0.021, "step": 39630 }, { "epoch": 0.43, "learning_rate": 0.00023572030875008106, "loss": 0.0179, "step": 39640 }, { "epoch": 0.43, "learning_rate": 0.00023570409288447818, "loss": 0.0236, "step": 39650 }, { "epoch": 0.43, "learning_rate": 0.00023568787701887524, "loss": 0.0178, "step": 39660 }, { "epoch": 0.43, "learning_rate": 0.00023567166115327234, "loss": 0.0217, "step": 39670 }, { "epoch": 0.43, "learning_rate": 0.00023565544528766945, "loss": 0.0209, "step": 39680 }, { "epoch": 0.43, "learning_rate": 0.00023563922942206655, "loss": 0.0222, "step": 39690 }, { "epoch": 0.43, "learning_rate": 0.0002356230135564636, "loss": 0.0202, "step": 39700 }, { "epoch": 0.43, "learning_rate": 0.0002356067976908607, "loss": 0.0222, "step": 39710 }, { "epoch": 0.43, "learning_rate": 0.00023559058182525783, "loss": 0.0186, "step": 39720 }, { "epoch": 0.43, "learning_rate": 0.00023557436595965492, "loss": 0.0224, "step": 39730 }, { "epoch": 0.43, "learning_rate": 0.00023555815009405198, "loss": 0.0196, "step": 39740 }, { "epoch": 0.43, "learning_rate": 0.0002355419342284491, "loss": 0.0227, "step": 39750 }, { "epoch": 0.43, "learning_rate": 0.0002355257183628462, "loss": 0.0238, "step": 39760 }, { "epoch": 0.43, "learning_rate": 0.0002355095024972433, "loss": 0.0206, "step": 39770 }, { "epoch": 0.43, "learning_rate": 0.00023549328663164036, "loss": 0.02, "step": 39780 }, { "epoch": 0.43, "learning_rate": 0.00023547707076603748, "loss": 0.022, "step": 39790 }, { "epoch": 0.43, "learning_rate": 0.00023546085490043457, "loss": 0.0172, "step": 39800 }, { "epoch": 0.43, "learning_rate": 0.00023544463903483166, "loss": 0.02, "step": 39810 }, { "epoch": 0.43, "learning_rate": 0.00023542842316922875, "loss": 0.0192, "step": 39820 }, { "epoch": 0.43, "learning_rate": 0.00023541220730362585, "loss": 0.017, "step": 39830 }, { "epoch": 0.43, "learning_rate": 0.00023539599143802294, "loss": 0.0148, "step": 39840 }, { "epoch": 0.43, "learning_rate": 0.00023537977557242006, "loss": 0.0198, "step": 39850 }, { "epoch": 0.43, "learning_rate": 0.00023536355970681712, "loss": 0.0224, "step": 39860 }, { "epoch": 0.43, "learning_rate": 0.00023534734384121422, "loss": 0.0195, "step": 39870 }, { "epoch": 0.43, "learning_rate": 0.0002353311279756113, "loss": 0.0172, "step": 39880 }, { "epoch": 0.43, "learning_rate": 0.00023531491211000843, "loss": 0.0221, "step": 39890 }, { "epoch": 0.43, "learning_rate": 0.0002352986962444055, "loss": 0.0248, "step": 39900 }, { "epoch": 0.43, "learning_rate": 0.0002352824803788026, "loss": 0.0184, "step": 39910 }, { "epoch": 0.43, "learning_rate": 0.0002352662645131997, "loss": 0.0217, "step": 39920 }, { "epoch": 0.43, "learning_rate": 0.0002352500486475968, "loss": 0.0192, "step": 39930 }, { "epoch": 0.43, "learning_rate": 0.00023523383278199387, "loss": 0.0193, "step": 39940 }, { "epoch": 0.43, "learning_rate": 0.00023521761691639096, "loss": 0.0189, "step": 39950 }, { "epoch": 0.43, "learning_rate": 0.00023520140105078808, "loss": 0.0236, "step": 39960 }, { "epoch": 0.43, "learning_rate": 0.00023518518518518517, "loss": 0.0185, "step": 39970 }, { "epoch": 0.43, "learning_rate": 0.00023516896931958224, "loss": 0.0198, "step": 39980 }, { "epoch": 0.43, "learning_rate": 0.00023515275345397936, "loss": 0.0213, "step": 39990 }, { "epoch": 0.43, "learning_rate": 0.00023513653758837645, "loss": 0.0182, "step": 40000 }, { "epoch": 0.43, "eval_cer": 0.9215938169367153, "eval_loss": 0.014509420841932297, "eval_runtime": 121.8906, "eval_samples_per_second": 16.408, "eval_steps_per_second": 4.102, "step": 40000 }, { "epoch": 0.43, "learning_rate": 0.00023512032172277354, "loss": 0.0186, "step": 40010 }, { "epoch": 0.43, "learning_rate": 0.0002351041058571706, "loss": 0.0214, "step": 40020 }, { "epoch": 0.43, "learning_rate": 0.00023508788999156773, "loss": 0.0202, "step": 40030 }, { "epoch": 0.43, "learning_rate": 0.00023507167412596482, "loss": 0.0185, "step": 40040 }, { "epoch": 0.43, "learning_rate": 0.00023505545826036194, "loss": 0.024, "step": 40050 }, { "epoch": 0.43, "learning_rate": 0.000235039242394759, "loss": 0.0195, "step": 40060 }, { "epoch": 0.43, "learning_rate": 0.0002350230265291561, "loss": 0.0197, "step": 40070 }, { "epoch": 0.43, "learning_rate": 0.0002350068106635532, "loss": 0.0217, "step": 40080 }, { "epoch": 0.43, "learning_rate": 0.0002349905947979503, "loss": 0.0215, "step": 40090 }, { "epoch": 0.43, "learning_rate": 0.00023497437893234738, "loss": 0.0195, "step": 40100 }, { "epoch": 0.43, "learning_rate": 0.00023495816306674447, "loss": 0.0196, "step": 40110 }, { "epoch": 0.43, "learning_rate": 0.0002349419472011416, "loss": 0.0216, "step": 40120 }, { "epoch": 0.43, "learning_rate": 0.00023492573133553868, "loss": 0.0202, "step": 40130 }, { "epoch": 0.43, "learning_rate": 0.00023490951546993575, "loss": 0.0205, "step": 40140 }, { "epoch": 0.43, "learning_rate": 0.00023489329960433284, "loss": 0.0182, "step": 40150 }, { "epoch": 0.43, "learning_rate": 0.00023487708373872996, "loss": 0.0185, "step": 40160 }, { "epoch": 0.43, "learning_rate": 0.00023486086787312705, "loss": 0.023, "step": 40170 }, { "epoch": 0.43, "learning_rate": 0.00023484465200752412, "loss": 0.0208, "step": 40180 }, { "epoch": 0.43, "learning_rate": 0.00023482843614192124, "loss": 0.0199, "step": 40190 }, { "epoch": 0.43, "learning_rate": 0.00023481222027631833, "loss": 0.02, "step": 40200 }, { "epoch": 0.43, "learning_rate": 0.00023479600441071542, "loss": 0.0195, "step": 40210 }, { "epoch": 0.43, "learning_rate": 0.0002347797885451125, "loss": 0.0197, "step": 40220 }, { "epoch": 0.43, "learning_rate": 0.0002347635726795096, "loss": 0.0222, "step": 40230 }, { "epoch": 0.44, "learning_rate": 0.0002347473568139067, "loss": 0.0182, "step": 40240 }, { "epoch": 0.44, "learning_rate": 0.0002347311409483038, "loss": 0.0195, "step": 40250 }, { "epoch": 0.44, "learning_rate": 0.0002347149250827009, "loss": 0.0229, "step": 40260 }, { "epoch": 0.44, "learning_rate": 0.00023469870921709798, "loss": 0.0211, "step": 40270 }, { "epoch": 0.44, "learning_rate": 0.00023468249335149507, "loss": 0.0191, "step": 40280 }, { "epoch": 0.44, "learning_rate": 0.0002346662774858922, "loss": 0.0169, "step": 40290 }, { "epoch": 0.44, "learning_rate": 0.00023465006162028929, "loss": 0.0205, "step": 40300 }, { "epoch": 0.44, "learning_rate": 0.00023463384575468635, "loss": 0.0188, "step": 40310 }, { "epoch": 0.44, "learning_rate": 0.00023461762988908344, "loss": 0.0209, "step": 40320 }, { "epoch": 0.44, "learning_rate": 0.00023460141402348056, "loss": 0.0269, "step": 40330 }, { "epoch": 0.44, "learning_rate": 0.00023458519815787766, "loss": 0.0203, "step": 40340 }, { "epoch": 0.44, "learning_rate": 0.00023456898229227472, "loss": 0.0227, "step": 40350 }, { "epoch": 0.44, "learning_rate": 0.00023455276642667184, "loss": 0.021, "step": 40360 }, { "epoch": 0.44, "learning_rate": 0.00023453655056106894, "loss": 0.0208, "step": 40370 }, { "epoch": 0.44, "learning_rate": 0.00023452033469546603, "loss": 0.0215, "step": 40380 }, { "epoch": 0.44, "learning_rate": 0.00023450411882986312, "loss": 0.0241, "step": 40390 }, { "epoch": 0.44, "learning_rate": 0.00023448790296426021, "loss": 0.0172, "step": 40400 }, { "epoch": 0.44, "learning_rate": 0.0002344716870986573, "loss": 0.0197, "step": 40410 }, { "epoch": 0.44, "learning_rate": 0.00023445547123305443, "loss": 0.0281, "step": 40420 }, { "epoch": 0.44, "learning_rate": 0.0002344392553674515, "loss": 0.0206, "step": 40430 }, { "epoch": 0.44, "learning_rate": 0.00023442303950184858, "loss": 0.0336, "step": 40440 }, { "epoch": 0.44, "learning_rate": 0.00023440682363624568, "loss": 0.0243, "step": 40450 }, { "epoch": 0.44, "learning_rate": 0.0002343906077706428, "loss": 0.0297, "step": 40460 }, { "epoch": 0.44, "learning_rate": 0.00023437439190503986, "loss": 0.0227, "step": 40470 }, { "epoch": 0.44, "learning_rate": 0.00023435817603943696, "loss": 0.037, "step": 40480 }, { "epoch": 0.44, "learning_rate": 0.00023434196017383408, "loss": 0.0193, "step": 40490 }, { "epoch": 0.44, "learning_rate": 0.00023432574430823117, "loss": 0.0221, "step": 40500 }, { "epoch": 0.44, "learning_rate": 0.00023430952844262823, "loss": 0.0623, "step": 40510 }, { "epoch": 0.44, "learning_rate": 0.00023429331257702533, "loss": 0.0249, "step": 40520 }, { "epoch": 0.44, "learning_rate": 0.00023427709671142245, "loss": 0.0252, "step": 40530 }, { "epoch": 0.44, "learning_rate": 0.00023426088084581954, "loss": 0.0206, "step": 40540 }, { "epoch": 0.44, "learning_rate": 0.0002342446649802166, "loss": 0.0181, "step": 40550 }, { "epoch": 0.44, "learning_rate": 0.00023422844911461372, "loss": 0.022, "step": 40560 }, { "epoch": 0.44, "learning_rate": 0.00023421223324901082, "loss": 0.0218, "step": 40570 }, { "epoch": 0.44, "learning_rate": 0.0002341960173834079, "loss": 0.0209, "step": 40580 }, { "epoch": 0.44, "learning_rate": 0.00023417980151780498, "loss": 0.0193, "step": 40590 }, { "epoch": 0.44, "learning_rate": 0.0002341635856522021, "loss": 0.0185, "step": 40600 }, { "epoch": 0.44, "learning_rate": 0.0002341473697865992, "loss": 0.0218, "step": 40610 }, { "epoch": 0.44, "learning_rate": 0.0002341311539209963, "loss": 0.021, "step": 40620 }, { "epoch": 0.44, "learning_rate": 0.00023411493805539337, "loss": 0.0228, "step": 40630 }, { "epoch": 0.44, "learning_rate": 0.00023409872218979047, "loss": 0.0226, "step": 40640 }, { "epoch": 0.44, "learning_rate": 0.00023408250632418756, "loss": 0.0241, "step": 40650 }, { "epoch": 0.44, "learning_rate": 0.00023406629045858468, "loss": 0.0298, "step": 40660 }, { "epoch": 0.44, "learning_rate": 0.00023405007459298174, "loss": 0.0223, "step": 40670 }, { "epoch": 0.44, "learning_rate": 0.00023403385872737884, "loss": 0.0277, "step": 40680 }, { "epoch": 0.44, "learning_rate": 0.00023401764286177596, "loss": 0.0224, "step": 40690 }, { "epoch": 0.44, "learning_rate": 0.00023400142699617305, "loss": 0.0231, "step": 40700 }, { "epoch": 0.44, "learning_rate": 0.00023398521113057012, "loss": 0.0194, "step": 40710 }, { "epoch": 0.44, "learning_rate": 0.0002339689952649672, "loss": 0.0232, "step": 40720 }, { "epoch": 0.44, "learning_rate": 0.00023395277939936433, "loss": 0.0228, "step": 40730 }, { "epoch": 0.44, "learning_rate": 0.00023393656353376142, "loss": 0.0203, "step": 40740 }, { "epoch": 0.44, "learning_rate": 0.0002339203476681585, "loss": 0.0197, "step": 40750 }, { "epoch": 0.44, "learning_rate": 0.0002339041318025556, "loss": 0.021, "step": 40760 }, { "epoch": 0.44, "learning_rate": 0.0002338879159369527, "loss": 0.0217, "step": 40770 }, { "epoch": 0.44, "learning_rate": 0.0002338717000713498, "loss": 0.0212, "step": 40780 }, { "epoch": 0.44, "learning_rate": 0.00023385548420574686, "loss": 0.0185, "step": 40790 }, { "epoch": 0.44, "learning_rate": 0.00023383926834014398, "loss": 0.0203, "step": 40800 }, { "epoch": 0.44, "learning_rate": 0.00023382305247454107, "loss": 0.0233, "step": 40810 }, { "epoch": 0.44, "learning_rate": 0.00023380683660893816, "loss": 0.0176, "step": 40820 }, { "epoch": 0.44, "learning_rate": 0.00023379062074333526, "loss": 0.0208, "step": 40830 }, { "epoch": 0.44, "learning_rate": 0.00023377440487773235, "loss": 0.0205, "step": 40840 }, { "epoch": 0.44, "learning_rate": 0.00023375818901212944, "loss": 0.0216, "step": 40850 }, { "epoch": 0.44, "learning_rate": 0.00023374197314652656, "loss": 0.0211, "step": 40860 }, { "epoch": 0.44, "learning_rate": 0.00023372575728092363, "loss": 0.0192, "step": 40870 }, { "epoch": 0.44, "learning_rate": 0.00023370954141532072, "loss": 0.0247, "step": 40880 }, { "epoch": 0.44, "learning_rate": 0.0002336933255497178, "loss": 0.0191, "step": 40890 }, { "epoch": 0.44, "learning_rate": 0.00023367710968411493, "loss": 0.0189, "step": 40900 }, { "epoch": 0.44, "learning_rate": 0.000233660893818512, "loss": 0.0266, "step": 40910 }, { "epoch": 0.44, "learning_rate": 0.0002336446779529091, "loss": 0.0178, "step": 40920 }, { "epoch": 0.44, "learning_rate": 0.0002336284620873062, "loss": 0.0186, "step": 40930 }, { "epoch": 0.44, "learning_rate": 0.0002336122462217033, "loss": 0.0183, "step": 40940 }, { "epoch": 0.44, "learning_rate": 0.00023359603035610037, "loss": 0.018, "step": 40950 }, { "epoch": 0.44, "learning_rate": 0.00023357981449049746, "loss": 0.0238, "step": 40960 }, { "epoch": 0.44, "learning_rate": 0.00023356359862489458, "loss": 0.02, "step": 40970 }, { "epoch": 0.44, "learning_rate": 0.00023354738275929167, "loss": 0.0184, "step": 40980 }, { "epoch": 0.44, "learning_rate": 0.00023353116689368874, "loss": 0.0184, "step": 40990 }, { "epoch": 0.44, "learning_rate": 0.00023351495102808586, "loss": 0.0204, "step": 41000 }, { "epoch": 0.44, "eval_cer": 0.9215903425248898, "eval_loss": 0.013930886052548885, "eval_runtime": 121.8476, "eval_samples_per_second": 16.414, "eval_steps_per_second": 4.103, "step": 41000 }, { "epoch": 0.44, "learning_rate": 0.00023349873516248295, "loss": 0.0193, "step": 41010 }, { "epoch": 0.44, "learning_rate": 0.00023348251929688005, "loss": 0.0246, "step": 41020 }, { "epoch": 0.44, "learning_rate": 0.00023346630343127717, "loss": 0.0188, "step": 41030 }, { "epoch": 0.44, "learning_rate": 0.00023345008756567423, "loss": 0.0192, "step": 41040 }, { "epoch": 0.44, "learning_rate": 0.00023343387170007132, "loss": 0.0175, "step": 41050 }, { "epoch": 0.44, "learning_rate": 0.00023341765583446844, "loss": 0.0205, "step": 41060 }, { "epoch": 0.44, "learning_rate": 0.00023340143996886554, "loss": 0.0214, "step": 41070 }, { "epoch": 0.44, "learning_rate": 0.0002333852241032626, "loss": 0.0165, "step": 41080 }, { "epoch": 0.44, "learning_rate": 0.0002333690082376597, "loss": 0.021, "step": 41090 }, { "epoch": 0.44, "learning_rate": 0.00023335279237205681, "loss": 0.0176, "step": 41100 }, { "epoch": 0.44, "learning_rate": 0.0002333365765064539, "loss": 0.0176, "step": 41110 }, { "epoch": 0.44, "learning_rate": 0.00023332036064085097, "loss": 0.0187, "step": 41120 }, { "epoch": 0.44, "learning_rate": 0.0002333041447752481, "loss": 0.0183, "step": 41130 }, { "epoch": 0.44, "learning_rate": 0.00023328792890964519, "loss": 0.019, "step": 41140 }, { "epoch": 0.44, "learning_rate": 0.00023327171304404228, "loss": 0.0227, "step": 41150 }, { "epoch": 0.44, "learning_rate": 0.00023325549717843934, "loss": 0.0185, "step": 41160 }, { "epoch": 0.45, "learning_rate": 0.00023323928131283646, "loss": 0.0227, "step": 41170 }, { "epoch": 0.45, "learning_rate": 0.00023322306544723356, "loss": 0.0204, "step": 41180 }, { "epoch": 0.45, "learning_rate": 0.00023320684958163065, "loss": 0.0187, "step": 41190 }, { "epoch": 0.45, "learning_rate": 0.00023319063371602774, "loss": 0.0185, "step": 41200 }, { "epoch": 0.45, "learning_rate": 0.00023317441785042483, "loss": 0.0229, "step": 41210 }, { "epoch": 0.45, "learning_rate": 0.00023315820198482193, "loss": 0.0198, "step": 41220 }, { "epoch": 0.45, "learning_rate": 0.00023314198611921905, "loss": 0.0216, "step": 41230 }, { "epoch": 0.45, "learning_rate": 0.0002331257702536161, "loss": 0.02, "step": 41240 }, { "epoch": 0.45, "learning_rate": 0.0002331095543880132, "loss": 0.0196, "step": 41250 }, { "epoch": 0.45, "learning_rate": 0.0002330933385224103, "loss": 0.0188, "step": 41260 }, { "epoch": 0.45, "learning_rate": 0.00023307712265680742, "loss": 0.0233, "step": 41270 }, { "epoch": 0.45, "learning_rate": 0.00023306090679120448, "loss": 0.0226, "step": 41280 }, { "epoch": 0.45, "learning_rate": 0.00023304469092560158, "loss": 0.0209, "step": 41290 }, { "epoch": 0.45, "learning_rate": 0.0002330284750599987, "loss": 0.0196, "step": 41300 }, { "epoch": 0.45, "learning_rate": 0.0002330122591943958, "loss": 0.0213, "step": 41310 }, { "epoch": 0.45, "learning_rate": 0.00023299604332879285, "loss": 0.0207, "step": 41320 }, { "epoch": 0.45, "learning_rate": 0.00023297982746318995, "loss": 0.021, "step": 41330 }, { "epoch": 0.45, "learning_rate": 0.00023296361159758707, "loss": 0.0227, "step": 41340 }, { "epoch": 0.45, "learning_rate": 0.00023294739573198416, "loss": 0.0168, "step": 41350 }, { "epoch": 0.45, "learning_rate": 0.00023293117986638123, "loss": 0.0199, "step": 41360 }, { "epoch": 0.45, "learning_rate": 0.00023291496400077835, "loss": 0.0185, "step": 41370 }, { "epoch": 0.45, "learning_rate": 0.00023289874813517544, "loss": 0.0208, "step": 41380 }, { "epoch": 0.45, "learning_rate": 0.00023288253226957253, "loss": 0.0192, "step": 41390 }, { "epoch": 0.45, "learning_rate": 0.00023286631640396962, "loss": 0.0212, "step": 41400 }, { "epoch": 0.45, "learning_rate": 0.00023285010053836672, "loss": 0.0206, "step": 41410 }, { "epoch": 0.45, "learning_rate": 0.0002328338846727638, "loss": 0.0209, "step": 41420 }, { "epoch": 0.45, "learning_rate": 0.00023281766880716093, "loss": 0.0215, "step": 41430 }, { "epoch": 0.45, "learning_rate": 0.000232801452941558, "loss": 0.026, "step": 41440 }, { "epoch": 0.45, "learning_rate": 0.0002327852370759551, "loss": 0.0198, "step": 41450 }, { "epoch": 0.45, "learning_rate": 0.00023276902121035218, "loss": 0.0174, "step": 41460 }, { "epoch": 0.45, "learning_rate": 0.0002327528053447493, "loss": 0.0216, "step": 41470 }, { "epoch": 0.45, "learning_rate": 0.00023273658947914637, "loss": 0.0192, "step": 41480 }, { "epoch": 0.45, "learning_rate": 0.00023272037361354346, "loss": 0.0217, "step": 41490 }, { "epoch": 0.45, "learning_rate": 0.00023270415774794058, "loss": 0.0204, "step": 41500 }, { "epoch": 0.45, "learning_rate": 0.00023268794188233767, "loss": 0.0241, "step": 41510 }, { "epoch": 0.45, "learning_rate": 0.00023267172601673474, "loss": 0.0202, "step": 41520 }, { "epoch": 0.45, "learning_rate": 0.00023265551015113183, "loss": 0.0151, "step": 41530 }, { "epoch": 0.45, "learning_rate": 0.00023263929428552895, "loss": 0.0216, "step": 41540 }, { "epoch": 0.45, "learning_rate": 0.00023262307841992604, "loss": 0.0205, "step": 41550 }, { "epoch": 0.45, "learning_rate": 0.0002326068625543231, "loss": 0.0205, "step": 41560 }, { "epoch": 0.45, "learning_rate": 0.00023259064668872023, "loss": 0.0186, "step": 41570 }, { "epoch": 0.45, "learning_rate": 0.00023257443082311732, "loss": 0.0189, "step": 41580 }, { "epoch": 0.45, "learning_rate": 0.0002325582149575144, "loss": 0.0158, "step": 41590 }, { "epoch": 0.45, "learning_rate": 0.00023254199909191148, "loss": 0.0183, "step": 41600 }, { "epoch": 0.45, "learning_rate": 0.0002325257832263086, "loss": 0.0212, "step": 41610 }, { "epoch": 0.45, "learning_rate": 0.0002325095673607057, "loss": 0.0186, "step": 41620 }, { "epoch": 0.45, "learning_rate": 0.0002324933514951028, "loss": 0.0201, "step": 41630 }, { "epoch": 0.45, "learning_rate": 0.00023247713562949988, "loss": 0.0185, "step": 41640 }, { "epoch": 0.45, "learning_rate": 0.00023246091976389697, "loss": 0.0198, "step": 41650 }, { "epoch": 0.45, "learning_rate": 0.00023244470389829406, "loss": 0.0191, "step": 41660 }, { "epoch": 0.45, "learning_rate": 0.00023242848803269118, "loss": 0.0198, "step": 41670 }, { "epoch": 0.45, "learning_rate": 0.00023241227216708825, "loss": 0.0217, "step": 41680 }, { "epoch": 0.45, "learning_rate": 0.00023239605630148534, "loss": 0.0248, "step": 41690 }, { "epoch": 0.45, "learning_rate": 0.00023237984043588246, "loss": 0.0183, "step": 41700 }, { "epoch": 0.45, "learning_rate": 0.00023236362457027955, "loss": 0.0205, "step": 41710 }, { "epoch": 0.45, "learning_rate": 0.00023234740870467665, "loss": 0.0228, "step": 41720 }, { "epoch": 0.45, "learning_rate": 0.0002323311928390737, "loss": 0.017, "step": 41730 }, { "epoch": 0.45, "learning_rate": 0.00023231497697347083, "loss": 0.0254, "step": 41740 }, { "epoch": 0.45, "learning_rate": 0.00023229876110786792, "loss": 0.0165, "step": 41750 }, { "epoch": 0.45, "learning_rate": 0.00023228254524226502, "loss": 0.0208, "step": 41760 }, { "epoch": 0.45, "learning_rate": 0.0002322663293766621, "loss": 0.0194, "step": 41770 }, { "epoch": 0.45, "learning_rate": 0.0002322501135110592, "loss": 0.0197, "step": 41780 }, { "epoch": 0.45, "learning_rate": 0.0002322338976454563, "loss": 0.0208, "step": 41790 }, { "epoch": 0.45, "learning_rate": 0.00023221768177985341, "loss": 0.0203, "step": 41800 }, { "epoch": 0.45, "learning_rate": 0.00023220146591425048, "loss": 0.0214, "step": 41810 }, { "epoch": 0.45, "learning_rate": 0.00023218525004864757, "loss": 0.0236, "step": 41820 }, { "epoch": 0.45, "learning_rate": 0.00023216903418304467, "loss": 0.0195, "step": 41830 }, { "epoch": 0.45, "learning_rate": 0.00023215281831744179, "loss": 0.0208, "step": 41840 }, { "epoch": 0.45, "learning_rate": 0.00023213660245183885, "loss": 0.019, "step": 41850 }, { "epoch": 0.45, "learning_rate": 0.00023212038658623594, "loss": 0.018, "step": 41860 }, { "epoch": 0.45, "learning_rate": 0.00023210417072063306, "loss": 0.0249, "step": 41870 }, { "epoch": 0.45, "learning_rate": 0.00023208795485503016, "loss": 0.0197, "step": 41880 }, { "epoch": 0.45, "learning_rate": 0.00023207173898942722, "loss": 0.0221, "step": 41890 }, { "epoch": 0.45, "learning_rate": 0.00023205552312382432, "loss": 0.0179, "step": 41900 }, { "epoch": 0.45, "learning_rate": 0.00023203930725822143, "loss": 0.0187, "step": 41910 }, { "epoch": 0.45, "learning_rate": 0.00023202309139261853, "loss": 0.0209, "step": 41920 }, { "epoch": 0.45, "learning_rate": 0.0002320068755270156, "loss": 0.0194, "step": 41930 }, { "epoch": 0.45, "learning_rate": 0.0002319906596614127, "loss": 0.0208, "step": 41940 }, { "epoch": 0.45, "learning_rate": 0.0002319744437958098, "loss": 0.0192, "step": 41950 }, { "epoch": 0.45, "learning_rate": 0.0002319582279302069, "loss": 0.0191, "step": 41960 }, { "epoch": 0.45, "learning_rate": 0.00023194201206460396, "loss": 0.0287, "step": 41970 }, { "epoch": 0.45, "learning_rate": 0.00023192579619900108, "loss": 0.0187, "step": 41980 }, { "epoch": 0.45, "learning_rate": 0.00023190958033339818, "loss": 0.0169, "step": 41990 }, { "epoch": 0.45, "learning_rate": 0.0002318933644677953, "loss": 0.0201, "step": 42000 }, { "epoch": 0.45, "eval_cer": 0.9215564670095912, "eval_loss": 0.014593328349292278, "eval_runtime": 121.8424, "eval_samples_per_second": 16.415, "eval_steps_per_second": 4.104, "step": 42000 }, { "epoch": 0.45, "learning_rate": 0.00023187714860219236, "loss": 0.0195, "step": 42010 }, { "epoch": 0.45, "learning_rate": 0.00023186093273658946, "loss": 0.021, "step": 42020 }, { "epoch": 0.45, "learning_rate": 0.00023184471687098655, "loss": 0.0185, "step": 42030 }, { "epoch": 0.45, "learning_rate": 0.00023182850100538367, "loss": 0.0203, "step": 42040 }, { "epoch": 0.45, "learning_rate": 0.00023181228513978073, "loss": 0.0206, "step": 42050 }, { "epoch": 0.45, "learning_rate": 0.00023179606927417783, "loss": 0.0186, "step": 42060 }, { "epoch": 0.45, "learning_rate": 0.00023177985340857495, "loss": 0.0199, "step": 42070 }, { "epoch": 0.45, "learning_rate": 0.00023176363754297204, "loss": 0.0214, "step": 42080 }, { "epoch": 0.46, "learning_rate": 0.0002317474216773691, "loss": 0.0216, "step": 42090 }, { "epoch": 0.46, "learning_rate": 0.0002317312058117662, "loss": 0.0286, "step": 42100 }, { "epoch": 0.46, "learning_rate": 0.00023171498994616332, "loss": 0.018, "step": 42110 }, { "epoch": 0.46, "learning_rate": 0.0002316987740805604, "loss": 0.0187, "step": 42120 }, { "epoch": 0.46, "learning_rate": 0.00023168255821495748, "loss": 0.0179, "step": 42130 }, { "epoch": 0.46, "learning_rate": 0.0002316663423493546, "loss": 0.0186, "step": 42140 }, { "epoch": 0.46, "learning_rate": 0.0002316501264837517, "loss": 0.0187, "step": 42150 }, { "epoch": 0.46, "learning_rate": 0.00023163391061814878, "loss": 0.0201, "step": 42160 }, { "epoch": 0.46, "learning_rate": 0.00023161769475254585, "loss": 0.0212, "step": 42170 }, { "epoch": 0.46, "learning_rate": 0.00023160147888694297, "loss": 0.0169, "step": 42180 }, { "epoch": 0.46, "learning_rate": 0.00023158526302134006, "loss": 0.0245, "step": 42190 }, { "epoch": 0.46, "learning_rate": 0.00023156904715573715, "loss": 0.0226, "step": 42200 }, { "epoch": 0.46, "learning_rate": 0.00023155283129013424, "loss": 0.0248, "step": 42210 }, { "epoch": 0.46, "learning_rate": 0.00023153661542453134, "loss": 0.0173, "step": 42220 }, { "epoch": 0.46, "learning_rate": 0.00023152039955892843, "loss": 0.0229, "step": 42230 }, { "epoch": 0.46, "learning_rate": 0.00023150418369332555, "loss": 0.0245, "step": 42240 }, { "epoch": 0.46, "learning_rate": 0.00023148796782772262, "loss": 0.0199, "step": 42250 }, { "epoch": 0.46, "learning_rate": 0.0002314717519621197, "loss": 0.0202, "step": 42260 }, { "epoch": 0.46, "learning_rate": 0.0002314555360965168, "loss": 0.0217, "step": 42270 }, { "epoch": 0.46, "learning_rate": 0.00023143932023091392, "loss": 0.0171, "step": 42280 }, { "epoch": 0.46, "learning_rate": 0.00023142310436531099, "loss": 0.0241, "step": 42290 }, { "epoch": 0.46, "learning_rate": 0.00023140688849970808, "loss": 0.0201, "step": 42300 }, { "epoch": 0.46, "learning_rate": 0.0002313906726341052, "loss": 0.0248, "step": 42310 }, { "epoch": 0.46, "learning_rate": 0.0002313744567685023, "loss": 0.0161, "step": 42320 }, { "epoch": 0.46, "learning_rate": 0.00023135824090289936, "loss": 0.0192, "step": 42330 }, { "epoch": 0.46, "learning_rate": 0.00023134202503729645, "loss": 0.02, "step": 42340 }, { "epoch": 0.46, "learning_rate": 0.00023132580917169357, "loss": 0.0224, "step": 42350 }, { "epoch": 0.46, "learning_rate": 0.00023130959330609066, "loss": 0.0235, "step": 42360 }, { "epoch": 0.46, "learning_rate": 0.00023129337744048773, "loss": 0.0214, "step": 42370 }, { "epoch": 0.46, "learning_rate": 0.00023127716157488485, "loss": 0.0168, "step": 42380 }, { "epoch": 0.46, "learning_rate": 0.00023126094570928194, "loss": 0.0215, "step": 42390 }, { "epoch": 0.46, "learning_rate": 0.00023124472984367903, "loss": 0.0225, "step": 42400 }, { "epoch": 0.46, "learning_rate": 0.00023122851397807613, "loss": 0.0244, "step": 42410 }, { "epoch": 0.46, "learning_rate": 0.00023121229811247322, "loss": 0.0203, "step": 42420 }, { "epoch": 0.46, "learning_rate": 0.0002311960822468703, "loss": 0.0202, "step": 42430 }, { "epoch": 0.46, "learning_rate": 0.00023117986638126743, "loss": 0.019, "step": 42440 }, { "epoch": 0.46, "learning_rate": 0.00023116365051566452, "loss": 0.0203, "step": 42450 }, { "epoch": 0.46, "learning_rate": 0.0002311474346500616, "loss": 0.0175, "step": 42460 }, { "epoch": 0.46, "learning_rate": 0.00023113121878445868, "loss": 0.018, "step": 42470 }, { "epoch": 0.46, "learning_rate": 0.0002311150029188558, "loss": 0.0193, "step": 42480 }, { "epoch": 0.46, "learning_rate": 0.0002310987870532529, "loss": 0.0216, "step": 42490 }, { "epoch": 0.46, "learning_rate": 0.00023108257118764996, "loss": 0.0183, "step": 42500 }, { "epoch": 0.46, "learning_rate": 0.00023106635532204708, "loss": 0.021, "step": 42510 }, { "epoch": 0.46, "learning_rate": 0.00023105013945644417, "loss": 0.0197, "step": 42520 }, { "epoch": 0.46, "learning_rate": 0.00023103392359084127, "loss": 0.024, "step": 42530 }, { "epoch": 0.46, "learning_rate": 0.00023101770772523833, "loss": 0.0198, "step": 42540 }, { "epoch": 0.46, "learning_rate": 0.00023100149185963545, "loss": 0.0188, "step": 42550 }, { "epoch": 0.46, "learning_rate": 0.00023098527599403254, "loss": 0.0177, "step": 42560 }, { "epoch": 0.46, "learning_rate": 0.00023096906012842964, "loss": 0.0234, "step": 42570 }, { "epoch": 0.46, "learning_rate": 0.00023095284426282673, "loss": 0.0221, "step": 42580 }, { "epoch": 0.46, "learning_rate": 0.00023093662839722382, "loss": 0.0199, "step": 42590 }, { "epoch": 0.46, "learning_rate": 0.00023092041253162092, "loss": 0.0195, "step": 42600 }, { "epoch": 0.46, "learning_rate": 0.00023090419666601804, "loss": 0.0172, "step": 42610 }, { "epoch": 0.46, "learning_rate": 0.0002308879808004151, "loss": 0.0201, "step": 42620 }, { "epoch": 0.46, "learning_rate": 0.0002308717649348122, "loss": 0.0202, "step": 42630 }, { "epoch": 0.46, "learning_rate": 0.00023085554906920931, "loss": 0.0204, "step": 42640 }, { "epoch": 0.46, "learning_rate": 0.0002308393332036064, "loss": 0.0171, "step": 42650 }, { "epoch": 0.46, "learning_rate": 0.00023082311733800347, "loss": 0.0206, "step": 42660 }, { "epoch": 0.46, "learning_rate": 0.00023080690147240056, "loss": 0.0221, "step": 42670 }, { "epoch": 0.46, "learning_rate": 0.00023079068560679768, "loss": 0.0199, "step": 42680 }, { "epoch": 0.46, "learning_rate": 0.00023077446974119478, "loss": 0.0182, "step": 42690 }, { "epoch": 0.46, "learning_rate": 0.00023075825387559184, "loss": 0.0213, "step": 42700 }, { "epoch": 0.46, "learning_rate": 0.00023074203800998896, "loss": 0.0206, "step": 42710 }, { "epoch": 0.46, "learning_rate": 0.00023072582214438606, "loss": 0.0188, "step": 42720 }, { "epoch": 0.46, "learning_rate": 0.00023070960627878315, "loss": 0.0198, "step": 42730 }, { "epoch": 0.46, "learning_rate": 0.00023069339041318021, "loss": 0.0178, "step": 42740 }, { "epoch": 0.46, "learning_rate": 0.00023067717454757733, "loss": 0.022, "step": 42750 }, { "epoch": 0.46, "learning_rate": 0.00023066095868197443, "loss": 0.0211, "step": 42760 }, { "epoch": 0.46, "learning_rate": 0.00023064474281637152, "loss": 0.0179, "step": 42770 }, { "epoch": 0.46, "learning_rate": 0.0002306285269507686, "loss": 0.0185, "step": 42780 }, { "epoch": 0.46, "learning_rate": 0.0002306123110851657, "loss": 0.0184, "step": 42790 }, { "epoch": 0.46, "learning_rate": 0.0002305960952195628, "loss": 0.0186, "step": 42800 }, { "epoch": 0.46, "learning_rate": 0.00023057987935395992, "loss": 0.0192, "step": 42810 }, { "epoch": 0.46, "learning_rate": 0.00023056366348835698, "loss": 0.0209, "step": 42820 }, { "epoch": 0.46, "learning_rate": 0.00023054744762275408, "loss": 0.0247, "step": 42830 }, { "epoch": 0.46, "learning_rate": 0.00023053123175715117, "loss": 0.0208, "step": 42840 }, { "epoch": 0.46, "learning_rate": 0.0002305150158915483, "loss": 0.0182, "step": 42850 }, { "epoch": 0.46, "learning_rate": 0.00023049880002594535, "loss": 0.0174, "step": 42860 }, { "epoch": 0.46, "learning_rate": 0.00023048258416034245, "loss": 0.0247, "step": 42870 }, { "epoch": 0.46, "learning_rate": 0.00023046636829473957, "loss": 0.0199, "step": 42880 }, { "epoch": 0.46, "learning_rate": 0.00023045015242913666, "loss": 0.0228, "step": 42890 }, { "epoch": 0.46, "learning_rate": 0.00023043393656353372, "loss": 0.0184, "step": 42900 }, { "epoch": 0.46, "learning_rate": 0.00023041772069793082, "loss": 0.0169, "step": 42910 }, { "epoch": 0.46, "learning_rate": 0.00023040150483232794, "loss": 0.0202, "step": 42920 }, { "epoch": 0.46, "learning_rate": 0.00023038528896672503, "loss": 0.0206, "step": 42930 }, { "epoch": 0.46, "learning_rate": 0.0002303690731011221, "loss": 0.025, "step": 42940 }, { "epoch": 0.46, "learning_rate": 0.00023035285723551922, "loss": 0.0205, "step": 42950 }, { "epoch": 0.46, "learning_rate": 0.0002303366413699163, "loss": 0.0183, "step": 42960 }, { "epoch": 0.46, "learning_rate": 0.0002303204255043134, "loss": 0.0197, "step": 42970 }, { "epoch": 0.46, "learning_rate": 0.00023030420963871047, "loss": 0.019, "step": 42980 }, { "epoch": 0.46, "learning_rate": 0.0002302879937731076, "loss": 0.0169, "step": 42990 }, { "epoch": 0.46, "learning_rate": 0.00023027177790750468, "loss": 0.0202, "step": 43000 }, { "epoch": 0.46, "eval_cer": 0.9215425693622891, "eval_loss": 0.013244155794382095, "eval_runtime": 121.8128, "eval_samples_per_second": 16.419, "eval_steps_per_second": 4.105, "step": 43000 }, { "epoch": 0.46, "learning_rate": 0.0002302555620419018, "loss": 0.0225, "step": 43010 }, { "epoch": 0.47, "learning_rate": 0.00023023934617629886, "loss": 0.0206, "step": 43020 }, { "epoch": 0.47, "learning_rate": 0.00023022313031069596, "loss": 0.0222, "step": 43030 }, { "epoch": 0.47, "learning_rate": 0.00023020691444509305, "loss": 0.0198, "step": 43040 }, { "epoch": 0.47, "learning_rate": 0.00023019069857949017, "loss": 0.0176, "step": 43050 }, { "epoch": 0.47, "learning_rate": 0.00023017448271388724, "loss": 0.0203, "step": 43060 }, { "epoch": 0.47, "learning_rate": 0.00023015826684828433, "loss": 0.0183, "step": 43070 }, { "epoch": 0.47, "learning_rate": 0.00023014205098268145, "loss": 0.0199, "step": 43080 }, { "epoch": 0.47, "learning_rate": 0.00023012583511707854, "loss": 0.0231, "step": 43090 }, { "epoch": 0.47, "learning_rate": 0.0002301096192514756, "loss": 0.0228, "step": 43100 }, { "epoch": 0.47, "learning_rate": 0.0002300934033858727, "loss": 0.0244, "step": 43110 }, { "epoch": 0.47, "learning_rate": 0.00023007718752026982, "loss": 0.0183, "step": 43120 }, { "epoch": 0.47, "learning_rate": 0.0002300609716546669, "loss": 0.0194, "step": 43130 }, { "epoch": 0.47, "learning_rate": 0.00023004475578906398, "loss": 0.0218, "step": 43140 }, { "epoch": 0.47, "learning_rate": 0.0002300285399234611, "loss": 0.0202, "step": 43150 }, { "epoch": 0.47, "learning_rate": 0.0002300123240578582, "loss": 0.0209, "step": 43160 }, { "epoch": 0.47, "learning_rate": 0.00022999610819225528, "loss": 0.0208, "step": 43170 }, { "epoch": 0.47, "learning_rate": 0.0002299798923266524, "loss": 0.0192, "step": 43180 }, { "epoch": 0.47, "learning_rate": 0.00022996367646104947, "loss": 0.0202, "step": 43190 }, { "epoch": 0.47, "learning_rate": 0.00022994746059544656, "loss": 0.0179, "step": 43200 }, { "epoch": 0.47, "learning_rate": 0.00022993124472984365, "loss": 0.0182, "step": 43210 }, { "epoch": 0.47, "learning_rate": 0.00022991502886424077, "loss": 0.0226, "step": 43220 }, { "epoch": 0.47, "learning_rate": 0.00022989881299863784, "loss": 0.0189, "step": 43230 }, { "epoch": 0.47, "learning_rate": 0.00022988259713303493, "loss": 0.02, "step": 43240 }, { "epoch": 0.47, "learning_rate": 0.00022986638126743205, "loss": 0.0165, "step": 43250 }, { "epoch": 0.47, "learning_rate": 0.00022985016540182914, "loss": 0.0203, "step": 43260 }, { "epoch": 0.47, "learning_rate": 0.0002298339495362262, "loss": 0.0205, "step": 43270 }, { "epoch": 0.47, "learning_rate": 0.0002298177336706233, "loss": 0.0197, "step": 43280 }, { "epoch": 0.47, "learning_rate": 0.00022980151780502042, "loss": 0.0204, "step": 43290 }, { "epoch": 0.47, "learning_rate": 0.00022978530193941752, "loss": 0.0256, "step": 43300 }, { "epoch": 0.47, "learning_rate": 0.00022976908607381458, "loss": 0.0214, "step": 43310 }, { "epoch": 0.47, "learning_rate": 0.0002297528702082117, "loss": 0.0182, "step": 43320 }, { "epoch": 0.47, "learning_rate": 0.0002297366543426088, "loss": 0.0181, "step": 43330 }, { "epoch": 0.47, "learning_rate": 0.0002297204384770059, "loss": 0.0207, "step": 43340 }, { "epoch": 0.47, "learning_rate": 0.00022970422261140295, "loss": 0.0183, "step": 43350 }, { "epoch": 0.47, "learning_rate": 0.00022968800674580007, "loss": 0.0176, "step": 43360 }, { "epoch": 0.47, "learning_rate": 0.00022967179088019717, "loss": 0.0168, "step": 43370 }, { "epoch": 0.47, "learning_rate": 0.00022965557501459429, "loss": 0.0167, "step": 43380 }, { "epoch": 0.47, "learning_rate": 0.00022963935914899135, "loss": 0.0237, "step": 43390 }, { "epoch": 0.47, "learning_rate": 0.00022962314328338844, "loss": 0.0192, "step": 43400 }, { "epoch": 0.47, "learning_rate": 0.00022960692741778554, "loss": 0.0178, "step": 43410 }, { "epoch": 0.47, "learning_rate": 0.00022959071155218266, "loss": 0.0197, "step": 43420 }, { "epoch": 0.47, "learning_rate": 0.00022957449568657972, "loss": 0.0192, "step": 43430 }, { "epoch": 0.47, "learning_rate": 0.00022955827982097681, "loss": 0.018, "step": 43440 }, { "epoch": 0.47, "learning_rate": 0.00022954206395537393, "loss": 0.0187, "step": 43450 }, { "epoch": 0.47, "learning_rate": 0.00022952584808977103, "loss": 0.0201, "step": 43460 }, { "epoch": 0.47, "learning_rate": 0.0002295096322241681, "loss": 0.0164, "step": 43470 }, { "epoch": 0.47, "learning_rate": 0.00022949341635856519, "loss": 0.0255, "step": 43480 }, { "epoch": 0.47, "learning_rate": 0.0002294772004929623, "loss": 0.0187, "step": 43490 }, { "epoch": 0.47, "learning_rate": 0.0002294609846273594, "loss": 0.0187, "step": 43500 }, { "epoch": 0.47, "learning_rate": 0.00022944476876175646, "loss": 0.0181, "step": 43510 }, { "epoch": 0.47, "learning_rate": 0.00022942855289615358, "loss": 0.0193, "step": 43520 }, { "epoch": 0.47, "learning_rate": 0.00022941233703055068, "loss": 0.0188, "step": 43530 }, { "epoch": 0.47, "learning_rate": 0.00022939612116494777, "loss": 0.0185, "step": 43540 }, { "epoch": 0.47, "learning_rate": 0.00022937990529934483, "loss": 0.0165, "step": 43550 }, { "epoch": 0.47, "learning_rate": 0.00022936368943374195, "loss": 0.018, "step": 43560 }, { "epoch": 0.47, "learning_rate": 0.00022934747356813905, "loss": 0.0186, "step": 43570 }, { "epoch": 0.47, "learning_rate": 0.00022933125770253614, "loss": 0.0167, "step": 43580 }, { "epoch": 0.47, "learning_rate": 0.00022931504183693323, "loss": 0.0161, "step": 43590 }, { "epoch": 0.47, "learning_rate": 0.00022929882597133033, "loss": 0.0156, "step": 43600 }, { "epoch": 0.47, "learning_rate": 0.00022928261010572742, "loss": 0.0164, "step": 43610 }, { "epoch": 0.47, "learning_rate": 0.00022926639424012454, "loss": 0.0177, "step": 43620 }, { "epoch": 0.47, "learning_rate": 0.0002292501783745216, "loss": 0.0186, "step": 43630 }, { "epoch": 0.47, "learning_rate": 0.0002292339625089187, "loss": 0.0185, "step": 43640 }, { "epoch": 0.47, "learning_rate": 0.00022921774664331582, "loss": 0.0275, "step": 43650 }, { "epoch": 0.47, "learning_rate": 0.0002292015307777129, "loss": 0.0258, "step": 43660 }, { "epoch": 0.47, "learning_rate": 0.00022918531491210997, "loss": 0.0386, "step": 43670 }, { "epoch": 0.47, "learning_rate": 0.00022916909904650707, "loss": 0.0334, "step": 43680 }, { "epoch": 0.47, "learning_rate": 0.0002291528831809042, "loss": 0.0205, "step": 43690 }, { "epoch": 0.47, "learning_rate": 0.00022913666731530128, "loss": 0.0176, "step": 43700 }, { "epoch": 0.47, "learning_rate": 0.00022912045144969835, "loss": 0.0203, "step": 43710 }, { "epoch": 0.47, "learning_rate": 0.00022910423558409547, "loss": 0.0175, "step": 43720 }, { "epoch": 0.47, "learning_rate": 0.00022908801971849256, "loss": 0.0232, "step": 43730 }, { "epoch": 0.47, "learning_rate": 0.00022907180385288965, "loss": 0.0187, "step": 43740 }, { "epoch": 0.47, "learning_rate": 0.00022905558798728672, "loss": 0.0187, "step": 43750 }, { "epoch": 0.47, "learning_rate": 0.00022903937212168384, "loss": 0.0142, "step": 43760 }, { "epoch": 0.47, "learning_rate": 0.00022902315625608093, "loss": 0.0209, "step": 43770 }, { "epoch": 0.47, "learning_rate": 0.00022900694039047802, "loss": 0.0231, "step": 43780 }, { "epoch": 0.47, "learning_rate": 0.00022899072452487511, "loss": 0.0214, "step": 43790 }, { "epoch": 0.47, "learning_rate": 0.0002289745086592722, "loss": 0.0171, "step": 43800 }, { "epoch": 0.47, "learning_rate": 0.0002289582927936693, "loss": 0.0223, "step": 43810 }, { "epoch": 0.47, "learning_rate": 0.00022894207692806642, "loss": 0.022, "step": 43820 }, { "epoch": 0.47, "learning_rate": 0.00022892586106246349, "loss": 0.0252, "step": 43830 }, { "epoch": 0.47, "learning_rate": 0.00022890964519686058, "loss": 0.0202, "step": 43840 }, { "epoch": 0.47, "learning_rate": 0.00022889342933125767, "loss": 0.0213, "step": 43850 }, { "epoch": 0.47, "learning_rate": 0.0002288772134656548, "loss": 0.0185, "step": 43860 }, { "epoch": 0.47, "learning_rate": 0.00022886099760005186, "loss": 0.0249, "step": 43870 }, { "epoch": 0.47, "learning_rate": 0.00022884478173444895, "loss": 0.019, "step": 43880 }, { "epoch": 0.47, "learning_rate": 0.00022882856586884607, "loss": 0.0218, "step": 43890 }, { "epoch": 0.47, "learning_rate": 0.00022881235000324316, "loss": 0.0225, "step": 43900 }, { "epoch": 0.47, "learning_rate": 0.00022879613413764025, "loss": 0.0185, "step": 43910 }, { "epoch": 0.47, "learning_rate": 0.00022877991827203732, "loss": 0.0228, "step": 43920 }, { "epoch": 0.47, "learning_rate": 0.00022876370240643444, "loss": 0.0191, "step": 43930 }, { "epoch": 0.48, "learning_rate": 0.00022874748654083153, "loss": 0.02, "step": 43940 }, { "epoch": 0.48, "learning_rate": 0.00022873127067522865, "loss": 0.0179, "step": 43950 }, { "epoch": 0.48, "learning_rate": 0.00022871505480962572, "loss": 0.0217, "step": 43960 }, { "epoch": 0.48, "learning_rate": 0.0002286988389440228, "loss": 0.0395, "step": 43970 }, { "epoch": 0.48, "learning_rate": 0.0002286826230784199, "loss": 0.0245, "step": 43980 }, { "epoch": 0.48, "learning_rate": 0.00022866640721281702, "loss": 0.0205, "step": 43990 }, { "epoch": 0.48, "learning_rate": 0.0002286501913472141, "loss": 0.0219, "step": 44000 }, { "epoch": 0.48, "eval_cer": 0.9215529925977656, "eval_loss": 0.0145536158233881, "eval_runtime": 121.7531, "eval_samples_per_second": 16.427, "eval_steps_per_second": 4.107, "step": 44000 }, { "epoch": 0.48, "learning_rate": 0.00022863397548161118, "loss": 0.0175, "step": 44010 }, { "epoch": 0.48, "learning_rate": 0.0002286177596160083, "loss": 0.0204, "step": 44020 }, { "epoch": 0.48, "learning_rate": 0.0002286015437504054, "loss": 0.0216, "step": 44030 }, { "epoch": 0.48, "learning_rate": 0.00022858532788480246, "loss": 0.023, "step": 44040 }, { "epoch": 0.48, "learning_rate": 0.00022856911201919955, "loss": 0.0179, "step": 44050 }, { "epoch": 0.48, "learning_rate": 0.00022855289615359667, "loss": 0.018, "step": 44060 }, { "epoch": 0.48, "learning_rate": 0.00022853668028799377, "loss": 0.0216, "step": 44070 }, { "epoch": 0.48, "learning_rate": 0.00022852046442239083, "loss": 0.0212, "step": 44080 }, { "epoch": 0.48, "learning_rate": 0.00022850424855678795, "loss": 0.0205, "step": 44090 }, { "epoch": 0.48, "learning_rate": 0.00022848803269118504, "loss": 0.0206, "step": 44100 }, { "epoch": 0.48, "learning_rate": 0.00022847181682558214, "loss": 0.0229, "step": 44110 }, { "epoch": 0.48, "learning_rate": 0.0002284556009599792, "loss": 0.0218, "step": 44120 }, { "epoch": 0.48, "learning_rate": 0.00022843938509437632, "loss": 0.0147, "step": 44130 }, { "epoch": 0.48, "learning_rate": 0.00022842316922877341, "loss": 0.0186, "step": 44140 }, { "epoch": 0.48, "learning_rate": 0.0002284069533631705, "loss": 0.0221, "step": 44150 }, { "epoch": 0.48, "learning_rate": 0.0002283907374975676, "loss": 0.0179, "step": 44160 }, { "epoch": 0.48, "learning_rate": 0.0002283745216319647, "loss": 0.0179, "step": 44170 }, { "epoch": 0.48, "learning_rate": 0.00022835830576636179, "loss": 0.02, "step": 44180 }, { "epoch": 0.48, "learning_rate": 0.0002283420899007589, "loss": 0.0192, "step": 44190 }, { "epoch": 0.48, "learning_rate": 0.00022832587403515597, "loss": 0.0208, "step": 44200 }, { "epoch": 0.48, "learning_rate": 0.00022830965816955306, "loss": 0.0195, "step": 44210 }, { "epoch": 0.48, "learning_rate": 0.00022829344230395016, "loss": 0.0206, "step": 44220 }, { "epoch": 0.48, "learning_rate": 0.00022827722643834728, "loss": 0.0191, "step": 44230 }, { "epoch": 0.48, "learning_rate": 0.00022826101057274434, "loss": 0.0192, "step": 44240 }, { "epoch": 0.48, "learning_rate": 0.00022824479470714144, "loss": 0.0199, "step": 44250 }, { "epoch": 0.48, "learning_rate": 0.00022822857884153855, "loss": 0.0211, "step": 44260 }, { "epoch": 0.48, "learning_rate": 0.00022821236297593565, "loss": 0.0216, "step": 44270 }, { "epoch": 0.48, "learning_rate": 0.0002281961471103327, "loss": 0.0196, "step": 44280 }, { "epoch": 0.48, "learning_rate": 0.0002281799312447298, "loss": 0.0202, "step": 44290 }, { "epoch": 0.48, "learning_rate": 0.00022816371537912693, "loss": 0.0211, "step": 44300 }, { "epoch": 0.48, "learning_rate": 0.00022814749951352402, "loss": 0.0241, "step": 44310 }, { "epoch": 0.48, "learning_rate": 0.00022813128364792108, "loss": 0.0193, "step": 44320 }, { "epoch": 0.48, "learning_rate": 0.0002281150677823182, "loss": 0.0216, "step": 44330 }, { "epoch": 0.48, "learning_rate": 0.0002280988519167153, "loss": 0.0201, "step": 44340 }, { "epoch": 0.48, "learning_rate": 0.0002280826360511124, "loss": 0.024, "step": 44350 }, { "epoch": 0.48, "learning_rate": 0.00022806642018550946, "loss": 0.021, "step": 44360 }, { "epoch": 0.48, "learning_rate": 0.00022805020431990658, "loss": 0.0206, "step": 44370 }, { "epoch": 0.48, "learning_rate": 0.00022803398845430367, "loss": 0.0165, "step": 44380 }, { "epoch": 0.48, "learning_rate": 0.0002280177725887008, "loss": 0.0221, "step": 44390 }, { "epoch": 0.48, "learning_rate": 0.00022800155672309785, "loss": 0.0185, "step": 44400 }, { "epoch": 0.48, "learning_rate": 0.00022798534085749495, "loss": 0.0195, "step": 44410 }, { "epoch": 0.48, "learning_rate": 0.00022796912499189204, "loss": 0.0186, "step": 44420 }, { "epoch": 0.48, "learning_rate": 0.00022795290912628916, "loss": 0.0198, "step": 44430 }, { "epoch": 0.48, "learning_rate": 0.00022793669326068622, "loss": 0.0206, "step": 44440 }, { "epoch": 0.48, "learning_rate": 0.00022792047739508332, "loss": 0.0195, "step": 44450 }, { "epoch": 0.48, "learning_rate": 0.00022790426152948044, "loss": 0.0159, "step": 44460 }, { "epoch": 0.48, "learning_rate": 0.00022788804566387753, "loss": 0.0185, "step": 44470 }, { "epoch": 0.48, "learning_rate": 0.0002278718297982746, "loss": 0.0195, "step": 44480 }, { "epoch": 0.48, "learning_rate": 0.0002278556139326717, "loss": 0.0185, "step": 44490 }, { "epoch": 0.48, "learning_rate": 0.0002278393980670688, "loss": 0.0205, "step": 44500 }, { "epoch": 0.48, "learning_rate": 0.0002278231822014659, "loss": 0.0163, "step": 44510 }, { "epoch": 0.48, "learning_rate": 0.00022780696633586297, "loss": 0.0203, "step": 44520 }, { "epoch": 0.48, "learning_rate": 0.00022779075047026009, "loss": 0.0207, "step": 44530 }, { "epoch": 0.48, "learning_rate": 0.00022777453460465718, "loss": 0.0196, "step": 44540 }, { "epoch": 0.48, "learning_rate": 0.00022775831873905427, "loss": 0.0209, "step": 44550 }, { "epoch": 0.48, "learning_rate": 0.00022774210287345134, "loss": 0.0239, "step": 44560 }, { "epoch": 0.48, "learning_rate": 0.00022772588700784846, "loss": 0.0177, "step": 44570 }, { "epoch": 0.48, "learning_rate": 0.00022770967114224555, "loss": 0.0194, "step": 44580 }, { "epoch": 0.48, "learning_rate": 0.00022769345527664264, "loss": 0.0195, "step": 44590 }, { "epoch": 0.48, "learning_rate": 0.00022767723941103976, "loss": 0.0171, "step": 44600 }, { "epoch": 0.48, "learning_rate": 0.00022766102354543683, "loss": 0.019, "step": 44610 }, { "epoch": 0.48, "learning_rate": 0.00022764480767983392, "loss": 0.0165, "step": 44620 }, { "epoch": 0.48, "learning_rate": 0.00022762859181423104, "loss": 0.02, "step": 44630 }, { "epoch": 0.48, "learning_rate": 0.00022761237594862813, "loss": 0.0192, "step": 44640 }, { "epoch": 0.48, "learning_rate": 0.0002275961600830252, "loss": 0.0193, "step": 44650 }, { "epoch": 0.48, "learning_rate": 0.00022757994421742232, "loss": 0.0187, "step": 44660 }, { "epoch": 0.48, "learning_rate": 0.0002275637283518194, "loss": 0.0177, "step": 44670 }, { "epoch": 0.48, "learning_rate": 0.0002275475124862165, "loss": 0.0201, "step": 44680 }, { "epoch": 0.48, "learning_rate": 0.00022753129662061357, "loss": 0.0209, "step": 44690 }, { "epoch": 0.48, "learning_rate": 0.0002275150807550107, "loss": 0.0171, "step": 44700 }, { "epoch": 0.48, "learning_rate": 0.00022749886488940778, "loss": 0.023, "step": 44710 }, { "epoch": 0.48, "learning_rate": 0.00022748264902380488, "loss": 0.0199, "step": 44720 }, { "epoch": 0.48, "learning_rate": 0.00022746643315820197, "loss": 0.0167, "step": 44730 }, { "epoch": 0.48, "learning_rate": 0.00022745021729259906, "loss": 0.0214, "step": 44740 }, { "epoch": 0.48, "learning_rate": 0.00022743400142699615, "loss": 0.0187, "step": 44750 }, { "epoch": 0.48, "learning_rate": 0.00022741778556139327, "loss": 0.0157, "step": 44760 }, { "epoch": 0.48, "learning_rate": 0.00022740156969579034, "loss": 0.0204, "step": 44770 }, { "epoch": 0.48, "learning_rate": 0.00022738535383018743, "loss": 0.0212, "step": 44780 }, { "epoch": 0.48, "learning_rate": 0.00022736913796458452, "loss": 0.0212, "step": 44790 }, { "epoch": 0.48, "learning_rate": 0.00022735292209898164, "loss": 0.0196, "step": 44800 }, { "epoch": 0.48, "learning_rate": 0.0002273367062333787, "loss": 0.0191, "step": 44810 }, { "epoch": 0.48, "learning_rate": 0.0002273204903677758, "loss": 0.0232, "step": 44820 }, { "epoch": 0.48, "learning_rate": 0.00022730427450217292, "loss": 0.0179, "step": 44830 }, { "epoch": 0.48, "learning_rate": 0.00022728805863657002, "loss": 0.0199, "step": 44840 }, { "epoch": 0.48, "learning_rate": 0.00022727184277096708, "loss": 0.0162, "step": 44850 }, { "epoch": 0.48, "learning_rate": 0.00022725562690536417, "loss": 0.0215, "step": 44860 }, { "epoch": 0.49, "learning_rate": 0.0002272394110397613, "loss": 0.0179, "step": 44870 }, { "epoch": 0.49, "learning_rate": 0.00022722319517415839, "loss": 0.0186, "step": 44880 }, { "epoch": 0.49, "learning_rate": 0.00022720697930855545, "loss": 0.0215, "step": 44890 }, { "epoch": 0.49, "learning_rate": 0.00022719076344295257, "loss": 0.0169, "step": 44900 }, { "epoch": 0.49, "learning_rate": 0.00022717454757734966, "loss": 0.0204, "step": 44910 }, { "epoch": 0.49, "learning_rate": 0.00022715833171174676, "loss": 0.0208, "step": 44920 }, { "epoch": 0.49, "learning_rate": 0.00022714211584614382, "loss": 0.0183, "step": 44930 }, { "epoch": 0.49, "learning_rate": 0.00022712589998054094, "loss": 0.0188, "step": 44940 }, { "epoch": 0.49, "learning_rate": 0.00022710968411493804, "loss": 0.0155, "step": 44950 }, { "epoch": 0.49, "learning_rate": 0.00022709346824933516, "loss": 0.0175, "step": 44960 }, { "epoch": 0.49, "learning_rate": 0.00022707725238373222, "loss": 0.0177, "step": 44970 }, { "epoch": 0.49, "learning_rate": 0.00022706103651812931, "loss": 0.0166, "step": 44980 }, { "epoch": 0.49, "learning_rate": 0.0002270448206525264, "loss": 0.0189, "step": 44990 }, { "epoch": 0.49, "learning_rate": 0.00022702860478692353, "loss": 0.0161, "step": 45000 }, { "epoch": 0.49, "eval_cer": 0.9215347519356817, "eval_loss": 0.013409956358373165, "eval_runtime": 121.5929, "eval_samples_per_second": 16.448, "eval_steps_per_second": 4.112, "step": 45000 }, { "epoch": 0.49, "learning_rate": 0.0002270123889213206, "loss": 0.0199, "step": 45010 }, { "epoch": 0.49, "learning_rate": 0.00022699617305571768, "loss": 0.0178, "step": 45020 }, { "epoch": 0.49, "learning_rate": 0.0002269799571901148, "loss": 0.0182, "step": 45030 }, { "epoch": 0.49, "learning_rate": 0.0002269637413245119, "loss": 0.0164, "step": 45040 }, { "epoch": 0.49, "learning_rate": 0.00022694752545890896, "loss": 0.0169, "step": 45050 }, { "epoch": 0.49, "learning_rate": 0.00022693130959330606, "loss": 0.0204, "step": 45060 }, { "epoch": 0.49, "learning_rate": 0.00022691509372770318, "loss": 0.0177, "step": 45070 }, { "epoch": 0.49, "learning_rate": 0.00022689887786210027, "loss": 0.0185, "step": 45080 }, { "epoch": 0.49, "learning_rate": 0.00022688266199649733, "loss": 0.0174, "step": 45090 }, { "epoch": 0.49, "learning_rate": 0.00022686644613089445, "loss": 0.0201, "step": 45100 }, { "epoch": 0.49, "learning_rate": 0.00022685023026529155, "loss": 0.0195, "step": 45110 }, { "epoch": 0.49, "learning_rate": 0.00022683401439968864, "loss": 0.0185, "step": 45120 }, { "epoch": 0.49, "learning_rate": 0.0002268177985340857, "loss": 0.0179, "step": 45130 }, { "epoch": 0.49, "learning_rate": 0.00022680158266848282, "loss": 0.0163, "step": 45140 }, { "epoch": 0.49, "learning_rate": 0.00022678536680287992, "loss": 0.0163, "step": 45150 }, { "epoch": 0.49, "learning_rate": 0.000226769150937277, "loss": 0.0193, "step": 45160 }, { "epoch": 0.49, "learning_rate": 0.0002267529350716741, "loss": 0.0188, "step": 45170 }, { "epoch": 0.49, "learning_rate": 0.0002267367192060712, "loss": 0.0184, "step": 45180 }, { "epoch": 0.49, "learning_rate": 0.0002267205033404683, "loss": 0.0221, "step": 45190 }, { "epoch": 0.49, "learning_rate": 0.0002267042874748654, "loss": 0.0206, "step": 45200 }, { "epoch": 0.49, "learning_rate": 0.00022668807160926247, "loss": 0.0174, "step": 45210 }, { "epoch": 0.49, "learning_rate": 0.00022667185574365957, "loss": 0.0188, "step": 45220 }, { "epoch": 0.49, "learning_rate": 0.00022665563987805666, "loss": 0.0233, "step": 45230 }, { "epoch": 0.49, "learning_rate": 0.00022663942401245378, "loss": 0.0189, "step": 45240 }, { "epoch": 0.49, "learning_rate": 0.00022662320814685084, "loss": 0.021, "step": 45250 }, { "epoch": 0.49, "learning_rate": 0.00022660699228124794, "loss": 0.0203, "step": 45260 }, { "epoch": 0.49, "learning_rate": 0.00022659077641564506, "loss": 0.0207, "step": 45270 }, { "epoch": 0.49, "learning_rate": 0.00022657456055004215, "loss": 0.0179, "step": 45280 }, { "epoch": 0.49, "learning_rate": 0.00022655834468443922, "loss": 0.0168, "step": 45290 }, { "epoch": 0.49, "learning_rate": 0.0002265421288188363, "loss": 0.0172, "step": 45300 }, { "epoch": 0.49, "learning_rate": 0.00022652591295323343, "loss": 0.0161, "step": 45310 }, { "epoch": 0.49, "learning_rate": 0.00022650969708763052, "loss": 0.0215, "step": 45320 }, { "epoch": 0.49, "learning_rate": 0.00022649348122202764, "loss": 0.0179, "step": 45330 }, { "epoch": 0.49, "learning_rate": 0.0002264772653564247, "loss": 0.0183, "step": 45340 }, { "epoch": 0.49, "learning_rate": 0.0002264610494908218, "loss": 0.0177, "step": 45350 }, { "epoch": 0.49, "learning_rate": 0.0002264448336252189, "loss": 0.0173, "step": 45360 }, { "epoch": 0.49, "learning_rate": 0.000226428617759616, "loss": 0.0181, "step": 45370 }, { "epoch": 0.49, "learning_rate": 0.00022641240189401308, "loss": 0.0181, "step": 45380 }, { "epoch": 0.49, "learning_rate": 0.00022639618602841017, "loss": 0.0266, "step": 45390 }, { "epoch": 0.49, "learning_rate": 0.0002263799701628073, "loss": 0.0196, "step": 45400 }, { "epoch": 0.49, "learning_rate": 0.00022636375429720438, "loss": 0.0189, "step": 45410 }, { "epoch": 0.49, "learning_rate": 0.00022634753843160145, "loss": 0.0191, "step": 45420 }, { "epoch": 0.49, "learning_rate": 0.00022633132256599854, "loss": 0.0219, "step": 45430 }, { "epoch": 0.49, "learning_rate": 0.00022631510670039566, "loss": 0.0182, "step": 45440 }, { "epoch": 0.49, "learning_rate": 0.00022629889083479275, "loss": 0.0213, "step": 45450 }, { "epoch": 0.49, "learning_rate": 0.00022628267496918982, "loss": 0.0172, "step": 45460 }, { "epoch": 0.49, "learning_rate": 0.00022626645910358694, "loss": 0.0191, "step": 45470 }, { "epoch": 0.49, "learning_rate": 0.00022625024323798403, "loss": 0.0182, "step": 45480 }, { "epoch": 0.49, "learning_rate": 0.00022623402737238112, "loss": 0.0199, "step": 45490 }, { "epoch": 0.49, "learning_rate": 0.0002262178115067782, "loss": 0.0197, "step": 45500 }, { "epoch": 0.49, "learning_rate": 0.0002262015956411753, "loss": 0.0196, "step": 45510 }, { "epoch": 0.49, "learning_rate": 0.0002261853797755724, "loss": 0.0203, "step": 45520 }, { "epoch": 0.49, "learning_rate": 0.0002261691639099695, "loss": 0.0178, "step": 45530 }, { "epoch": 0.49, "learning_rate": 0.0002261529480443666, "loss": 0.017, "step": 45540 }, { "epoch": 0.49, "learning_rate": 0.00022613673217876368, "loss": 0.0181, "step": 45550 }, { "epoch": 0.49, "learning_rate": 0.00022612051631316077, "loss": 0.0201, "step": 45560 }, { "epoch": 0.49, "learning_rate": 0.0002261043004475579, "loss": 0.0212, "step": 45570 }, { "epoch": 0.49, "learning_rate": 0.00022608808458195496, "loss": 0.0153, "step": 45580 }, { "epoch": 0.49, "learning_rate": 0.00022607186871635205, "loss": 0.0192, "step": 45590 }, { "epoch": 0.49, "learning_rate": 0.00022605565285074915, "loss": 0.0173, "step": 45600 }, { "epoch": 0.49, "learning_rate": 0.00022603943698514626, "loss": 0.0174, "step": 45610 }, { "epoch": 0.49, "learning_rate": 0.00022602322111954333, "loss": 0.0215, "step": 45620 }, { "epoch": 0.49, "learning_rate": 0.00022600700525394042, "loss": 0.0235, "step": 45630 }, { "epoch": 0.49, "learning_rate": 0.00022599078938833754, "loss": 0.0201, "step": 45640 }, { "epoch": 0.49, "learning_rate": 0.00022597457352273464, "loss": 0.0183, "step": 45650 }, { "epoch": 0.49, "learning_rate": 0.0002259583576571317, "loss": 0.0194, "step": 45660 }, { "epoch": 0.49, "learning_rate": 0.00022594214179152882, "loss": 0.0201, "step": 45670 }, { "epoch": 0.49, "learning_rate": 0.00022592592592592591, "loss": 0.0193, "step": 45680 }, { "epoch": 0.49, "learning_rate": 0.000225909710060323, "loss": 0.0172, "step": 45690 }, { "epoch": 0.49, "learning_rate": 0.00022589349419472007, "loss": 0.0171, "step": 45700 }, { "epoch": 0.49, "learning_rate": 0.0002258772783291172, "loss": 0.0171, "step": 45710 }, { "epoch": 0.49, "learning_rate": 0.00022586106246351429, "loss": 0.0153, "step": 45720 }, { "epoch": 0.49, "learning_rate": 0.00022584484659791138, "loss": 0.0179, "step": 45730 }, { "epoch": 0.49, "learning_rate": 0.00022582863073230847, "loss": 0.0163, "step": 45740 }, { "epoch": 0.49, "learning_rate": 0.00022581241486670556, "loss": 0.0178, "step": 45750 }, { "epoch": 0.49, "learning_rate": 0.00022579619900110266, "loss": 0.0162, "step": 45760 }, { "epoch": 0.49, "learning_rate": 0.00022577998313549978, "loss": 0.0202, "step": 45770 }, { "epoch": 0.49, "learning_rate": 0.00022576376726989684, "loss": 0.0189, "step": 45780 }, { "epoch": 0.5, "learning_rate": 0.00022574755140429393, "loss": 0.0211, "step": 45790 }, { "epoch": 0.5, "learning_rate": 0.00022573133553869103, "loss": 0.0197, "step": 45800 }, { "epoch": 0.5, "learning_rate": 0.00022571511967308815, "loss": 0.02, "step": 45810 }, { "epoch": 0.5, "learning_rate": 0.0002256989038074852, "loss": 0.0177, "step": 45820 }, { "epoch": 0.5, "learning_rate": 0.0002256826879418823, "loss": 0.0183, "step": 45830 }, { "epoch": 0.5, "learning_rate": 0.00022566647207627943, "loss": 0.0167, "step": 45840 }, { "epoch": 0.5, "learning_rate": 0.00022565025621067652, "loss": 0.0185, "step": 45850 }, { "epoch": 0.5, "learning_rate": 0.00022563404034507358, "loss": 0.0257, "step": 45860 }, { "epoch": 0.5, "learning_rate": 0.00022561782447947068, "loss": 0.0202, "step": 45870 }, { "epoch": 0.5, "learning_rate": 0.0002256016086138678, "loss": 0.0186, "step": 45880 }, { "epoch": 0.5, "learning_rate": 0.0002255853927482649, "loss": 0.0203, "step": 45890 }, { "epoch": 0.5, "learning_rate": 0.00022556917688266195, "loss": 0.0203, "step": 45900 }, { "epoch": 0.5, "learning_rate": 0.00022555296101705907, "loss": 0.0194, "step": 45910 }, { "epoch": 0.5, "learning_rate": 0.00022553674515145617, "loss": 0.0217, "step": 45920 }, { "epoch": 0.5, "learning_rate": 0.00022552052928585326, "loss": 0.0186, "step": 45930 }, { "epoch": 0.5, "learning_rate": 0.00022550431342025033, "loss": 0.0192, "step": 45940 }, { "epoch": 0.5, "learning_rate": 0.00022548809755464745, "loss": 0.0229, "step": 45950 }, { "epoch": 0.5, "learning_rate": 0.00022547188168904454, "loss": 0.0189, "step": 45960 }, { "epoch": 0.5, "learning_rate": 0.00022545566582344166, "loss": 0.0167, "step": 45970 }, { "epoch": 0.5, "learning_rate": 0.00022543944995783872, "loss": 0.0171, "step": 45980 }, { "epoch": 0.5, "learning_rate": 0.00022542323409223582, "loss": 0.021, "step": 45990 }, { "epoch": 0.5, "learning_rate": 0.0002254070182266329, "loss": 0.0172, "step": 46000 }, { "epoch": 0.5, "eval_cer": 0.9215503867888964, "eval_loss": 0.01366225816309452, "eval_runtime": 121.4419, "eval_samples_per_second": 16.469, "eval_steps_per_second": 4.117, "step": 46000 }, { "epoch": 0.5, "learning_rate": 0.00022539080236103003, "loss": 0.0189, "step": 46010 }, { "epoch": 0.5, "learning_rate": 0.0002253745864954271, "loss": 0.0161, "step": 46020 }, { "epoch": 0.5, "learning_rate": 0.0002253583706298242, "loss": 0.0206, "step": 46030 }, { "epoch": 0.5, "learning_rate": 0.0002253421547642213, "loss": 0.0199, "step": 46040 }, { "epoch": 0.5, "learning_rate": 0.0002253259388986184, "loss": 0.0169, "step": 46050 }, { "epoch": 0.5, "learning_rate": 0.0002253097230330155, "loss": 0.0192, "step": 46060 }, { "epoch": 0.5, "learning_rate": 0.00022529350716741256, "loss": 0.0192, "step": 46070 }, { "epoch": 0.5, "learning_rate": 0.00022527729130180968, "loss": 0.019, "step": 46080 }, { "epoch": 0.5, "learning_rate": 0.00022526107543620677, "loss": 0.0179, "step": 46090 }, { "epoch": 0.5, "learning_rate": 0.00022524485957060386, "loss": 0.0202, "step": 46100 }, { "epoch": 0.5, "learning_rate": 0.00022522864370500096, "loss": 0.0198, "step": 46110 }, { "epoch": 0.5, "learning_rate": 0.00022521242783939805, "loss": 0.0194, "step": 46120 }, { "epoch": 0.5, "learning_rate": 0.00022519621197379514, "loss": 0.0219, "step": 46130 }, { "epoch": 0.5, "learning_rate": 0.00022517999610819226, "loss": 0.0175, "step": 46140 }, { "epoch": 0.5, "learning_rate": 0.00022516378024258933, "loss": 0.0191, "step": 46150 }, { "epoch": 0.5, "learning_rate": 0.00022514756437698642, "loss": 0.0167, "step": 46160 }, { "epoch": 0.5, "learning_rate": 0.0002251313485113835, "loss": 0.015, "step": 46170 }, { "epoch": 0.5, "learning_rate": 0.00022511513264578063, "loss": 0.0188, "step": 46180 }, { "epoch": 0.5, "learning_rate": 0.0002250989167801777, "loss": 0.0182, "step": 46190 }, { "epoch": 0.5, "learning_rate": 0.0002250827009145748, "loss": 0.0201, "step": 46200 }, { "epoch": 0.5, "learning_rate": 0.0002250664850489719, "loss": 0.0209, "step": 46210 }, { "epoch": 0.5, "learning_rate": 0.000225050269183369, "loss": 0.0174, "step": 46220 }, { "epoch": 0.5, "learning_rate": 0.00022503405331776607, "loss": 0.017, "step": 46230 }, { "epoch": 0.5, "learning_rate": 0.00022501783745216316, "loss": 0.0195, "step": 46240 }, { "epoch": 0.5, "learning_rate": 0.00022500162158656028, "loss": 0.0169, "step": 46250 }, { "epoch": 0.5, "learning_rate": 0.00022498540572095737, "loss": 0.0167, "step": 46260 }, { "epoch": 0.5, "learning_rate": 0.00022496918985535444, "loss": 0.0178, "step": 46270 }, { "epoch": 0.5, "learning_rate": 0.00022495297398975156, "loss": 0.0162, "step": 46280 }, { "epoch": 0.5, "learning_rate": 0.00022493675812414865, "loss": 0.0168, "step": 46290 }, { "epoch": 0.5, "learning_rate": 0.00022492054225854575, "loss": 0.0219, "step": 46300 }, { "epoch": 0.5, "learning_rate": 0.0002249043263929428, "loss": 0.019, "step": 46310 }, { "epoch": 0.5, "learning_rate": 0.00022488811052733993, "loss": 0.0209, "step": 46320 }, { "epoch": 0.5, "learning_rate": 0.00022487189466173702, "loss": 0.0198, "step": 46330 }, { "epoch": 0.5, "learning_rate": 0.00022485567879613414, "loss": 0.0229, "step": 46340 }, { "epoch": 0.5, "learning_rate": 0.0002248394629305312, "loss": 0.0156, "step": 46350 }, { "epoch": 0.5, "learning_rate": 0.0002248232470649283, "loss": 0.0167, "step": 46360 }, { "epoch": 0.5, "learning_rate": 0.0002248070311993254, "loss": 0.0219, "step": 46370 }, { "epoch": 0.5, "learning_rate": 0.00022479081533372251, "loss": 0.0213, "step": 46380 }, { "epoch": 0.5, "learning_rate": 0.00022477459946811958, "loss": 0.0199, "step": 46390 }, { "epoch": 0.5, "learning_rate": 0.00022475838360251667, "loss": 0.0202, "step": 46400 }, { "epoch": 0.5, "learning_rate": 0.0002247421677369138, "loss": 0.0328, "step": 46410 }, { "epoch": 0.5, "learning_rate": 0.00022472595187131089, "loss": 0.0231, "step": 46420 }, { "epoch": 0.5, "learning_rate": 0.00022470973600570795, "loss": 0.0206, "step": 46430 }, { "epoch": 0.5, "learning_rate": 0.00022469352014010504, "loss": 0.0189, "step": 46440 }, { "epoch": 0.5, "learning_rate": 0.00022467730427450216, "loss": 0.0179, "step": 46450 }, { "epoch": 0.5, "learning_rate": 0.00022466108840889926, "loss": 0.014, "step": 46460 }, { "epoch": 0.5, "learning_rate": 0.00022464487254329632, "loss": 0.0178, "step": 46470 }, { "epoch": 0.5, "learning_rate": 0.00022462865667769344, "loss": 0.0186, "step": 46480 }, { "epoch": 0.5, "learning_rate": 0.00022461244081209053, "loss": 0.0181, "step": 46490 }, { "epoch": 0.5, "learning_rate": 0.00022459622494648763, "loss": 0.019, "step": 46500 }, { "epoch": 0.5, "learning_rate": 0.0002245800090808847, "loss": 0.019, "step": 46510 }, { "epoch": 0.5, "learning_rate": 0.0002245637932152818, "loss": 0.0232, "step": 46520 }, { "epoch": 0.5, "learning_rate": 0.0002245475773496789, "loss": 0.0207, "step": 46530 }, { "epoch": 0.5, "learning_rate": 0.000224531361484076, "loss": 0.0199, "step": 46540 }, { "epoch": 0.5, "learning_rate": 0.0002245151456184731, "loss": 0.0177, "step": 46550 }, { "epoch": 0.5, "learning_rate": 0.00022449892975287018, "loss": 0.0179, "step": 46560 }, { "epoch": 0.5, "learning_rate": 0.00022448271388726728, "loss": 0.0259, "step": 46570 }, { "epoch": 0.5, "learning_rate": 0.0002244664980216644, "loss": 0.0185, "step": 46580 }, { "epoch": 0.5, "learning_rate": 0.00022445028215606146, "loss": 0.0188, "step": 46590 }, { "epoch": 0.5, "learning_rate": 0.00022443406629045855, "loss": 0.0315, "step": 46600 }, { "epoch": 0.5, "learning_rate": 0.00022441785042485565, "loss": 0.0219, "step": 46610 }, { "epoch": 0.5, "learning_rate": 0.00022440163455925277, "loss": 0.0223, "step": 46620 }, { "epoch": 0.5, "learning_rate": 0.00022438541869364983, "loss": 0.0226, "step": 46630 }, { "epoch": 0.5, "learning_rate": 0.00022436920282804693, "loss": 0.0226, "step": 46640 }, { "epoch": 0.5, "learning_rate": 0.00022435298696244405, "loss": 0.0219, "step": 46650 }, { "epoch": 0.5, "learning_rate": 0.00022433677109684114, "loss": 0.0183, "step": 46660 }, { "epoch": 0.5, "learning_rate": 0.0002243205552312382, "loss": 0.0176, "step": 46670 }, { "epoch": 0.5, "learning_rate": 0.00022430433936563532, "loss": 0.021, "step": 46680 }, { "epoch": 0.5, "learning_rate": 0.00022428812350003242, "loss": 0.0206, "step": 46690 }, { "epoch": 0.5, "learning_rate": 0.0002242719076344295, "loss": 0.016, "step": 46700 }, { "epoch": 0.5, "learning_rate": 0.00022425569176882658, "loss": 0.0217, "step": 46710 }, { "epoch": 0.51, "learning_rate": 0.0002242394759032237, "loss": 0.0183, "step": 46720 }, { "epoch": 0.51, "learning_rate": 0.0002242232600376208, "loss": 0.0177, "step": 46730 }, { "epoch": 0.51, "learning_rate": 0.00022420704417201788, "loss": 0.0179, "step": 46740 }, { "epoch": 0.51, "learning_rate": 0.00022419082830641497, "loss": 0.0174, "step": 46750 }, { "epoch": 0.51, "learning_rate": 0.00022417461244081207, "loss": 0.0158, "step": 46760 }, { "epoch": 0.51, "learning_rate": 0.00022415839657520916, "loss": 0.0208, "step": 46770 }, { "epoch": 0.51, "learning_rate": 0.00022414218070960628, "loss": 0.0206, "step": 46780 }, { "epoch": 0.51, "learning_rate": 0.00022412596484400337, "loss": 0.0248, "step": 46790 }, { "epoch": 0.51, "learning_rate": 0.00022410974897840044, "loss": 0.0181, "step": 46800 }, { "epoch": 0.51, "learning_rate": 0.00022409353311279753, "loss": 0.0205, "step": 46810 }, { "epoch": 0.51, "learning_rate": 0.00022407731724719465, "loss": 0.0183, "step": 46820 }, { "epoch": 0.51, "learning_rate": 0.00022406110138159174, "loss": 0.02, "step": 46830 }, { "epoch": 0.51, "learning_rate": 0.0002240448855159888, "loss": 0.0215, "step": 46840 }, { "epoch": 0.51, "learning_rate": 0.00022402866965038593, "loss": 0.0177, "step": 46850 }, { "epoch": 0.51, "learning_rate": 0.00022401245378478302, "loss": 0.0167, "step": 46860 }, { "epoch": 0.51, "learning_rate": 0.0002239962379191801, "loss": 0.016, "step": 46870 }, { "epoch": 0.51, "learning_rate": 0.00022398002205357718, "loss": 0.0157, "step": 46880 }, { "epoch": 0.51, "learning_rate": 0.0002239638061879743, "loss": 0.0174, "step": 46890 }, { "epoch": 0.51, "learning_rate": 0.0002239475903223714, "loss": 0.0174, "step": 46900 }, { "epoch": 0.51, "learning_rate": 0.00022393137445676848, "loss": 0.0183, "step": 46910 }, { "epoch": 0.51, "learning_rate": 0.00022391515859116558, "loss": 0.0173, "step": 46920 }, { "epoch": 0.51, "learning_rate": 0.00022389894272556267, "loss": 0.0195, "step": 46930 }, { "epoch": 0.51, "learning_rate": 0.00022388272685995976, "loss": 0.0193, "step": 46940 }, { "epoch": 0.51, "learning_rate": 0.00022386651099435688, "loss": 0.0201, "step": 46950 }, { "epoch": 0.51, "learning_rate": 0.00022385029512875395, "loss": 0.0161, "step": 46960 }, { "epoch": 0.51, "learning_rate": 0.00022383407926315104, "loss": 0.0166, "step": 46970 }, { "epoch": 0.51, "learning_rate": 0.00022381786339754816, "loss": 0.0193, "step": 46980 }, { "epoch": 0.51, "learning_rate": 0.00022380164753194525, "loss": 0.0153, "step": 46990 }, { "epoch": 0.51, "learning_rate": 0.00022378543166634232, "loss": 0.0199, "step": 47000 }, { "epoch": 0.51, "eval_cer": 0.9215434379652454, "eval_loss": 0.013291054405272007, "eval_runtime": 121.5822, "eval_samples_per_second": 16.45, "eval_steps_per_second": 4.112, "step": 47000 }, { "epoch": 0.51, "learning_rate": 0.0002237692158007394, "loss": 0.02, "step": 47010 }, { "epoch": 0.51, "learning_rate": 0.00022375299993513653, "loss": 0.0203, "step": 47020 }, { "epoch": 0.51, "learning_rate": 0.00022373678406953362, "loss": 0.0192, "step": 47030 }, { "epoch": 0.51, "learning_rate": 0.0002237205682039307, "loss": 0.0214, "step": 47040 }, { "epoch": 0.51, "learning_rate": 0.0002237043523383278, "loss": 0.0159, "step": 47050 }, { "epoch": 0.51, "learning_rate": 0.0002236881364727249, "loss": 0.0195, "step": 47060 }, { "epoch": 0.51, "learning_rate": 0.000223671920607122, "loss": 0.0229, "step": 47070 }, { "epoch": 0.51, "learning_rate": 0.00022365570474151906, "loss": 0.0148, "step": 47080 }, { "epoch": 0.51, "learning_rate": 0.00022363948887591618, "loss": 0.0208, "step": 47090 }, { "epoch": 0.51, "learning_rate": 0.00022362327301031327, "loss": 0.0177, "step": 47100 }, { "epoch": 0.51, "learning_rate": 0.00022360705714471037, "loss": 0.0182, "step": 47110 }, { "epoch": 0.51, "learning_rate": 0.00022359084127910746, "loss": 0.0186, "step": 47120 }, { "epoch": 0.51, "learning_rate": 0.00022357462541350455, "loss": 0.017, "step": 47130 }, { "epoch": 0.51, "learning_rate": 0.00022355840954790164, "loss": 0.0192, "step": 47140 }, { "epoch": 0.51, "learning_rate": 0.00022354219368229876, "loss": 0.0179, "step": 47150 }, { "epoch": 0.51, "learning_rate": 0.00022352597781669583, "loss": 0.0178, "step": 47160 }, { "epoch": 0.51, "learning_rate": 0.00022350976195109292, "loss": 0.021, "step": 47170 }, { "epoch": 0.51, "learning_rate": 0.00022349354608549002, "loss": 0.02, "step": 47180 }, { "epoch": 0.51, "learning_rate": 0.00022347733021988714, "loss": 0.0223, "step": 47190 }, { "epoch": 0.51, "learning_rate": 0.0002234611143542842, "loss": 0.0199, "step": 47200 }, { "epoch": 0.51, "learning_rate": 0.0002234448984886813, "loss": 0.0187, "step": 47210 }, { "epoch": 0.51, "learning_rate": 0.0002234286826230784, "loss": 0.0197, "step": 47220 }, { "epoch": 0.51, "learning_rate": 0.0002234124667574755, "loss": 0.0179, "step": 47230 }, { "epoch": 0.51, "learning_rate": 0.00022339625089187257, "loss": 0.0216, "step": 47240 }, { "epoch": 0.51, "learning_rate": 0.00022338003502626966, "loss": 0.02, "step": 47250 }, { "epoch": 0.51, "learning_rate": 0.00022336381916066678, "loss": 0.0207, "step": 47260 }, { "epoch": 0.51, "learning_rate": 0.00022334760329506388, "loss": 0.0184, "step": 47270 }, { "epoch": 0.51, "learning_rate": 0.00022333138742946094, "loss": 0.0201, "step": 47280 }, { "epoch": 0.51, "learning_rate": 0.00022331517156385806, "loss": 0.0187, "step": 47290 }, { "epoch": 0.51, "learning_rate": 0.00022329895569825516, "loss": 0.0194, "step": 47300 }, { "epoch": 0.51, "learning_rate": 0.00022328273983265225, "loss": 0.0154, "step": 47310 }, { "epoch": 0.51, "learning_rate": 0.00022326652396704931, "loss": 0.0196, "step": 47320 }, { "epoch": 0.51, "learning_rate": 0.00022325030810144643, "loss": 0.0167, "step": 47330 }, { "epoch": 0.51, "learning_rate": 0.00022323409223584353, "loss": 0.019, "step": 47340 }, { "epoch": 0.51, "learning_rate": 0.00022321787637024065, "loss": 0.0224, "step": 47350 }, { "epoch": 0.51, "learning_rate": 0.0002232016605046377, "loss": 0.0185, "step": 47360 }, { "epoch": 0.51, "learning_rate": 0.0002231854446390348, "loss": 0.0181, "step": 47370 }, { "epoch": 0.51, "learning_rate": 0.0002231692287734319, "loss": 0.0184, "step": 47380 }, { "epoch": 0.51, "learning_rate": 0.00022315301290782902, "loss": 0.0169, "step": 47390 }, { "epoch": 0.51, "learning_rate": 0.00022313679704222608, "loss": 0.0173, "step": 47400 }, { "epoch": 0.51, "learning_rate": 0.00022312058117662318, "loss": 0.0203, "step": 47410 }, { "epoch": 0.51, "learning_rate": 0.0002231043653110203, "loss": 0.0172, "step": 47420 }, { "epoch": 0.51, "learning_rate": 0.0002230881494454174, "loss": 0.0185, "step": 47430 }, { "epoch": 0.51, "learning_rate": 0.00022307193357981445, "loss": 0.0195, "step": 47440 }, { "epoch": 0.51, "learning_rate": 0.00022305571771421155, "loss": 0.0168, "step": 47450 }, { "epoch": 0.51, "learning_rate": 0.00022303950184860867, "loss": 0.0172, "step": 47460 }, { "epoch": 0.51, "learning_rate": 0.00022302328598300576, "loss": 0.0154, "step": 47470 }, { "epoch": 0.51, "learning_rate": 0.00022300707011740285, "loss": 0.0207, "step": 47480 }, { "epoch": 0.51, "learning_rate": 0.00022299085425179994, "loss": 0.0223, "step": 47490 }, { "epoch": 0.51, "learning_rate": 0.00022297463838619704, "loss": 0.0172, "step": 47500 }, { "epoch": 0.51, "learning_rate": 0.00022295842252059413, "loss": 0.0192, "step": 47510 }, { "epoch": 0.51, "learning_rate": 0.00022294220665499125, "loss": 0.0201, "step": 47520 }, { "epoch": 0.51, "learning_rate": 0.00022292599078938832, "loss": 0.0191, "step": 47530 }, { "epoch": 0.51, "learning_rate": 0.0002229097749237854, "loss": 0.0179, "step": 47540 }, { "epoch": 0.51, "learning_rate": 0.0002228935590581825, "loss": 0.0174, "step": 47550 }, { "epoch": 0.51, "learning_rate": 0.00022287734319257962, "loss": 0.0181, "step": 47560 }, { "epoch": 0.51, "learning_rate": 0.0002228611273269767, "loss": 0.0188, "step": 47570 }, { "epoch": 0.51, "learning_rate": 0.00022284491146137378, "loss": 0.0204, "step": 47580 }, { "epoch": 0.51, "learning_rate": 0.0002228286955957709, "loss": 0.0188, "step": 47590 }, { "epoch": 0.51, "learning_rate": 0.000222812479730168, "loss": 0.0154, "step": 47600 }, { "epoch": 0.51, "learning_rate": 0.00022279626386456506, "loss": 0.0195, "step": 47610 }, { "epoch": 0.51, "learning_rate": 0.00022278004799896215, "loss": 0.0177, "step": 47620 }, { "epoch": 0.51, "learning_rate": 0.00022276383213335927, "loss": 0.0163, "step": 47630 }, { "epoch": 0.52, "learning_rate": 0.00022274761626775636, "loss": 0.0176, "step": 47640 }, { "epoch": 0.52, "learning_rate": 0.00022273140040215343, "loss": 0.0158, "step": 47650 }, { "epoch": 0.52, "learning_rate": 0.00022271518453655055, "loss": 0.0206, "step": 47660 }, { "epoch": 0.52, "learning_rate": 0.00022269896867094764, "loss": 0.0177, "step": 47670 }, { "epoch": 0.52, "learning_rate": 0.00022268275280534473, "loss": 0.0172, "step": 47680 }, { "epoch": 0.52, "learning_rate": 0.0002226665369397418, "loss": 0.0192, "step": 47690 }, { "epoch": 0.52, "learning_rate": 0.00022265032107413892, "loss": 0.0188, "step": 47700 }, { "epoch": 0.52, "learning_rate": 0.000222634105208536, "loss": 0.0179, "step": 47710 }, { "epoch": 0.52, "learning_rate": 0.00022261788934293313, "loss": 0.0187, "step": 47720 }, { "epoch": 0.52, "learning_rate": 0.0002226016734773302, "loss": 0.0177, "step": 47730 }, { "epoch": 0.52, "learning_rate": 0.0002225854576117273, "loss": 0.0172, "step": 47740 }, { "epoch": 0.52, "learning_rate": 0.00022256924174612438, "loss": 0.0217, "step": 47750 }, { "epoch": 0.52, "learning_rate": 0.0002225530258805215, "loss": 0.0154, "step": 47760 }, { "epoch": 0.52, "learning_rate": 0.00022253681001491857, "loss": 0.0178, "step": 47770 }, { "epoch": 0.52, "learning_rate": 0.00022252059414931566, "loss": 0.0208, "step": 47780 }, { "epoch": 0.52, "learning_rate": 0.00022250437828371278, "loss": 0.0176, "step": 47790 }, { "epoch": 0.52, "learning_rate": 0.00022248816241810987, "loss": 0.0226, "step": 47800 }, { "epoch": 0.52, "learning_rate": 0.00022247194655250694, "loss": 0.0192, "step": 47810 }, { "epoch": 0.52, "learning_rate": 0.00022245573068690403, "loss": 0.018, "step": 47820 }, { "epoch": 0.52, "learning_rate": 0.00022243951482130115, "loss": 0.0163, "step": 47830 }, { "epoch": 0.52, "learning_rate": 0.00022242329895569824, "loss": 0.0174, "step": 47840 }, { "epoch": 0.52, "learning_rate": 0.0002224070830900953, "loss": 0.0208, "step": 47850 }, { "epoch": 0.52, "learning_rate": 0.00022239086722449243, "loss": 0.0186, "step": 47860 }, { "epoch": 0.52, "learning_rate": 0.00022237465135888952, "loss": 0.0159, "step": 47870 }, { "epoch": 0.52, "learning_rate": 0.00022235843549328662, "loss": 0.0173, "step": 47880 }, { "epoch": 0.52, "learning_rate": 0.00022234221962768368, "loss": 0.0166, "step": 47890 }, { "epoch": 0.52, "learning_rate": 0.0002223260037620808, "loss": 0.0189, "step": 47900 }, { "epoch": 0.52, "learning_rate": 0.0002223097878964779, "loss": 0.0193, "step": 47910 }, { "epoch": 0.52, "learning_rate": 0.000222293572030875, "loss": 0.0196, "step": 47920 }, { "epoch": 0.52, "learning_rate": 0.00022227735616527208, "loss": 0.0188, "step": 47930 }, { "epoch": 0.52, "learning_rate": 0.00022226114029966917, "loss": 0.0222, "step": 47940 }, { "epoch": 0.52, "learning_rate": 0.00022224492443406627, "loss": 0.0184, "step": 47950 }, { "epoch": 0.52, "learning_rate": 0.00022222870856846338, "loss": 0.0187, "step": 47960 }, { "epoch": 0.52, "learning_rate": 0.00022221249270286045, "loss": 0.0181, "step": 47970 }, { "epoch": 0.52, "learning_rate": 0.00022219627683725754, "loss": 0.0188, "step": 47980 }, { "epoch": 0.52, "learning_rate": 0.00022218006097165466, "loss": 0.0218, "step": 47990 }, { "epoch": 0.52, "learning_rate": 0.00022216384510605176, "loss": 0.0211, "step": 48000 }, { "epoch": 0.52, "eval_cer": 0.9215460437741146, "eval_loss": 0.013234671205282211, "eval_runtime": 121.4322, "eval_samples_per_second": 16.47, "eval_steps_per_second": 4.118, "step": 48000 }, { "epoch": 0.52, "learning_rate": 0.00022214762924044882, "loss": 0.0167, "step": 48010 }, { "epoch": 0.52, "learning_rate": 0.00022213141337484591, "loss": 0.0182, "step": 48020 }, { "epoch": 0.52, "learning_rate": 0.00022211519750924303, "loss": 0.0195, "step": 48030 }, { "epoch": 0.52, "learning_rate": 0.00022209898164364013, "loss": 0.0179, "step": 48040 }, { "epoch": 0.52, "learning_rate": 0.0002220827657780372, "loss": 0.0152, "step": 48050 }, { "epoch": 0.52, "learning_rate": 0.0002220665499124343, "loss": 0.0172, "step": 48060 }, { "epoch": 0.52, "learning_rate": 0.0002220503340468314, "loss": 0.018, "step": 48070 }, { "epoch": 0.52, "learning_rate": 0.0002220341181812285, "loss": 0.0173, "step": 48080 }, { "epoch": 0.52, "learning_rate": 0.00022201790231562556, "loss": 0.0187, "step": 48090 }, { "epoch": 0.52, "learning_rate": 0.00022200168645002268, "loss": 0.0184, "step": 48100 }, { "epoch": 0.52, "learning_rate": 0.00022198547058441978, "loss": 0.0182, "step": 48110 }, { "epoch": 0.52, "learning_rate": 0.00022196925471881687, "loss": 0.0173, "step": 48120 }, { "epoch": 0.52, "learning_rate": 0.00022195303885321396, "loss": 0.0187, "step": 48130 }, { "epoch": 0.52, "learning_rate": 0.00022193682298761105, "loss": 0.0181, "step": 48140 }, { "epoch": 0.52, "learning_rate": 0.00022192060712200815, "loss": 0.0169, "step": 48150 }, { "epoch": 0.52, "learning_rate": 0.00022190439125640527, "loss": 0.0201, "step": 48160 }, { "epoch": 0.52, "learning_rate": 0.00022188817539080233, "loss": 0.0168, "step": 48170 }, { "epoch": 0.52, "learning_rate": 0.00022187195952519943, "loss": 0.0187, "step": 48180 }, { "epoch": 0.52, "learning_rate": 0.00022185574365959652, "loss": 0.0211, "step": 48190 }, { "epoch": 0.52, "learning_rate": 0.00022183952779399364, "loss": 0.0175, "step": 48200 }, { "epoch": 0.52, "learning_rate": 0.00022182331192839073, "loss": 0.0199, "step": 48210 }, { "epoch": 0.52, "learning_rate": 0.0002218070960627878, "loss": 0.02, "step": 48220 }, { "epoch": 0.52, "learning_rate": 0.00022179088019718492, "loss": 0.0225, "step": 48230 }, { "epoch": 0.52, "learning_rate": 0.000221774664331582, "loss": 0.0186, "step": 48240 }, { "epoch": 0.52, "learning_rate": 0.0002217584484659791, "loss": 0.0184, "step": 48250 }, { "epoch": 0.52, "learning_rate": 0.00022174223260037617, "loss": 0.0179, "step": 48260 }, { "epoch": 0.52, "learning_rate": 0.0002217260167347733, "loss": 0.0172, "step": 48270 }, { "epoch": 0.52, "learning_rate": 0.00022170980086917038, "loss": 0.0215, "step": 48280 }, { "epoch": 0.52, "learning_rate": 0.0002216935850035675, "loss": 0.0155, "step": 48290 }, { "epoch": 0.52, "learning_rate": 0.00022167736913796457, "loss": 0.0175, "step": 48300 }, { "epoch": 0.52, "learning_rate": 0.00022166115327236166, "loss": 0.0176, "step": 48310 }, { "epoch": 0.52, "learning_rate": 0.00022164493740675875, "loss": 0.016, "step": 48320 }, { "epoch": 0.52, "learning_rate": 0.00022162872154115587, "loss": 0.0175, "step": 48330 }, { "epoch": 0.52, "learning_rate": 0.00022161250567555294, "loss": 0.0191, "step": 48340 }, { "epoch": 0.52, "learning_rate": 0.00022159628980995003, "loss": 0.0193, "step": 48350 }, { "epoch": 0.52, "learning_rate": 0.00022158007394434715, "loss": 0.0172, "step": 48360 }, { "epoch": 0.52, "learning_rate": 0.00022156385807874424, "loss": 0.0208, "step": 48370 }, { "epoch": 0.52, "learning_rate": 0.0002215476422131413, "loss": 0.0168, "step": 48380 }, { "epoch": 0.52, "learning_rate": 0.0002215314263475384, "loss": 0.0171, "step": 48390 }, { "epoch": 0.52, "learning_rate": 0.00022151521048193552, "loss": 0.016, "step": 48400 }, { "epoch": 0.52, "learning_rate": 0.0002214989946163326, "loss": 0.0188, "step": 48410 }, { "epoch": 0.52, "learning_rate": 0.00022148277875072968, "loss": 0.0199, "step": 48420 }, { "epoch": 0.52, "learning_rate": 0.0002214665628851268, "loss": 0.0221, "step": 48430 }, { "epoch": 0.52, "learning_rate": 0.0002214503470195239, "loss": 0.0197, "step": 48440 }, { "epoch": 0.52, "learning_rate": 0.00022143413115392098, "loss": 0.0204, "step": 48450 }, { "epoch": 0.52, "learning_rate": 0.00022141791528831805, "loss": 0.0205, "step": 48460 }, { "epoch": 0.52, "learning_rate": 0.00022140169942271517, "loss": 0.0201, "step": 48470 }, { "epoch": 0.52, "learning_rate": 0.00022138548355711226, "loss": 0.0174, "step": 48480 }, { "epoch": 0.52, "learning_rate": 0.00022136926769150935, "loss": 0.0166, "step": 48490 }, { "epoch": 0.52, "learning_rate": 0.00022135305182590645, "loss": 0.0157, "step": 48500 }, { "epoch": 0.52, "learning_rate": 0.00022133683596030354, "loss": 0.0208, "step": 48510 }, { "epoch": 0.52, "learning_rate": 0.00022132062009470063, "loss": 0.0159, "step": 48520 }, { "epoch": 0.52, "learning_rate": 0.00022130440422909775, "loss": 0.02, "step": 48530 }, { "epoch": 0.52, "learning_rate": 0.00022128818836349482, "loss": 0.0197, "step": 48540 }, { "epoch": 0.52, "learning_rate": 0.0002212719724978919, "loss": 0.0206, "step": 48550 }, { "epoch": 0.52, "learning_rate": 0.000221255756632289, "loss": 0.0189, "step": 48560 }, { "epoch": 0.53, "learning_rate": 0.00022123954076668612, "loss": 0.0193, "step": 48570 }, { "epoch": 0.53, "learning_rate": 0.0002212233249010832, "loss": 0.0186, "step": 48580 }, { "epoch": 0.53, "learning_rate": 0.00022120710903548028, "loss": 0.0166, "step": 48590 }, { "epoch": 0.53, "learning_rate": 0.0002211908931698774, "loss": 0.0204, "step": 48600 }, { "epoch": 0.53, "learning_rate": 0.0002211746773042745, "loss": 0.0209, "step": 48610 }, { "epoch": 0.53, "learning_rate": 0.00022115846143867156, "loss": 0.0204, "step": 48620 }, { "epoch": 0.53, "learning_rate": 0.00022114224557306865, "loss": 0.0162, "step": 48630 }, { "epoch": 0.53, "learning_rate": 0.00022112602970746577, "loss": 0.0148, "step": 48640 }, { "epoch": 0.53, "learning_rate": 0.00022110981384186287, "loss": 0.0186, "step": 48650 }, { "epoch": 0.53, "learning_rate": 0.00022109359797625993, "loss": 0.017, "step": 48660 }, { "epoch": 0.53, "learning_rate": 0.00022107738211065705, "loss": 0.0165, "step": 48670 }, { "epoch": 0.53, "learning_rate": 0.00022106116624505414, "loss": 0.0219, "step": 48680 }, { "epoch": 0.53, "learning_rate": 0.00022104495037945124, "loss": 0.0183, "step": 48690 }, { "epoch": 0.53, "learning_rate": 0.0002210287345138483, "loss": 0.0172, "step": 48700 }, { "epoch": 0.53, "learning_rate": 0.00022101251864824542, "loss": 0.0185, "step": 48710 }, { "epoch": 0.53, "learning_rate": 0.00022099630278264251, "loss": 0.0207, "step": 48720 }, { "epoch": 0.53, "learning_rate": 0.00022098008691703963, "loss": 0.0178, "step": 48730 }, { "epoch": 0.53, "learning_rate": 0.0002209638710514367, "loss": 0.0193, "step": 48740 }, { "epoch": 0.53, "learning_rate": 0.0002209476551858338, "loss": 0.0191, "step": 48750 }, { "epoch": 0.53, "learning_rate": 0.00022093143932023089, "loss": 0.0204, "step": 48760 }, { "epoch": 0.53, "learning_rate": 0.000220915223454628, "loss": 0.0165, "step": 48770 }, { "epoch": 0.53, "learning_rate": 0.00022089900758902507, "loss": 0.017, "step": 48780 }, { "epoch": 0.53, "learning_rate": 0.00022088279172342216, "loss": 0.018, "step": 48790 }, { "epoch": 0.53, "learning_rate": 0.00022086657585781928, "loss": 0.0158, "step": 48800 }, { "epoch": 0.53, "learning_rate": 0.00022085035999221638, "loss": 0.0204, "step": 48810 }, { "epoch": 0.53, "learning_rate": 0.00022083414412661344, "loss": 0.0198, "step": 48820 }, { "epoch": 0.53, "learning_rate": 0.00022081792826101053, "loss": 0.0206, "step": 48830 }, { "epoch": 0.53, "learning_rate": 0.00022080171239540765, "loss": 0.016, "step": 48840 }, { "epoch": 0.53, "learning_rate": 0.00022078549652980475, "loss": 0.017, "step": 48850 }, { "epoch": 0.53, "learning_rate": 0.0002207692806642018, "loss": 0.0155, "step": 48860 }, { "epoch": 0.53, "learning_rate": 0.00022075306479859893, "loss": 0.0186, "step": 48870 }, { "epoch": 0.53, "learning_rate": 0.00022073684893299603, "loss": 0.0168, "step": 48880 }, { "epoch": 0.53, "learning_rate": 0.00022072063306739312, "loss": 0.0247, "step": 48890 }, { "epoch": 0.53, "learning_rate": 0.00022070441720179018, "loss": 0.0187, "step": 48900 }, { "epoch": 0.53, "learning_rate": 0.0002206882013361873, "loss": 0.0187, "step": 48910 }, { "epoch": 0.53, "learning_rate": 0.0002206719854705844, "loss": 0.0197, "step": 48920 }, { "epoch": 0.53, "learning_rate": 0.0002206557696049815, "loss": 0.0178, "step": 48930 }, { "epoch": 0.53, "learning_rate": 0.0002206395537393786, "loss": 0.02, "step": 48940 }, { "epoch": 0.53, "learning_rate": 0.00022062333787377567, "loss": 0.0209, "step": 48950 }, { "epoch": 0.53, "learning_rate": 0.00022060712200817277, "loss": 0.0193, "step": 48960 }, { "epoch": 0.53, "learning_rate": 0.0002205909061425699, "loss": 0.0298, "step": 48970 }, { "epoch": 0.53, "learning_rate": 0.00022057469027696698, "loss": 0.0256, "step": 48980 }, { "epoch": 0.53, "learning_rate": 0.00022055847441136405, "loss": 0.022, "step": 48990 }, { "epoch": 0.53, "learning_rate": 0.00022054225854576117, "loss": 0.0184, "step": 49000 }, { "epoch": 0.53, "eval_cer": 0.921567758848024, "eval_loss": 0.013597916811704636, "eval_runtime": 121.4697, "eval_samples_per_second": 16.465, "eval_steps_per_second": 4.116, "step": 49000 }, { "epoch": 0.53, "learning_rate": 0.00022052604268015826, "loss": 0.0191, "step": 49010 }, { "epoch": 0.53, "learning_rate": 0.00022050982681455535, "loss": 0.0179, "step": 49020 }, { "epoch": 0.53, "learning_rate": 0.00022049361094895242, "loss": 0.0198, "step": 49030 }, { "epoch": 0.53, "learning_rate": 0.00022047739508334954, "loss": 0.0202, "step": 49040 }, { "epoch": 0.53, "learning_rate": 0.00022046117921774663, "loss": 0.016, "step": 49050 }, { "epoch": 0.53, "learning_rate": 0.00022044496335214372, "loss": 0.0199, "step": 49060 }, { "epoch": 0.53, "learning_rate": 0.00022042874748654081, "loss": 0.0165, "step": 49070 }, { "epoch": 0.53, "learning_rate": 0.0002204125316209379, "loss": 0.0186, "step": 49080 }, { "epoch": 0.53, "learning_rate": 0.000220396315755335, "loss": 0.015, "step": 49090 }, { "epoch": 0.53, "learning_rate": 0.00022038009988973212, "loss": 0.0179, "step": 49100 }, { "epoch": 0.53, "learning_rate": 0.00022036388402412919, "loss": 0.0206, "step": 49110 }, { "epoch": 0.53, "learning_rate": 0.00022034766815852628, "loss": 0.0158, "step": 49120 }, { "epoch": 0.53, "learning_rate": 0.00022033145229292337, "loss": 0.0193, "step": 49130 }, { "epoch": 0.53, "learning_rate": 0.0002203152364273205, "loss": 0.0181, "step": 49140 }, { "epoch": 0.53, "learning_rate": 0.00022029902056171756, "loss": 0.0187, "step": 49150 }, { "epoch": 0.53, "learning_rate": 0.00022028280469611465, "loss": 0.0197, "step": 49160 }, { "epoch": 0.53, "learning_rate": 0.00022026658883051177, "loss": 0.0192, "step": 49170 }, { "epoch": 0.53, "learning_rate": 0.00022025037296490886, "loss": 0.0181, "step": 49180 }, { "epoch": 0.53, "learning_rate": 0.00022023415709930593, "loss": 0.0214, "step": 49190 }, { "epoch": 0.53, "learning_rate": 0.00022021794123370302, "loss": 0.0175, "step": 49200 }, { "epoch": 0.53, "learning_rate": 0.00022020172536810014, "loss": 0.0159, "step": 49210 }, { "epoch": 0.53, "learning_rate": 0.00022018550950249723, "loss": 0.0161, "step": 49220 }, { "epoch": 0.53, "learning_rate": 0.0002201692936368943, "loss": 0.0173, "step": 49230 }, { "epoch": 0.53, "learning_rate": 0.00022015307777129142, "loss": 0.0165, "step": 49240 }, { "epoch": 0.53, "learning_rate": 0.0002201368619056885, "loss": 0.0174, "step": 49250 }, { "epoch": 0.53, "learning_rate": 0.0002201206460400856, "loss": 0.0207, "step": 49260 }, { "epoch": 0.53, "learning_rate": 0.00022010443017448267, "loss": 0.0235, "step": 49270 }, { "epoch": 0.53, "learning_rate": 0.0002200882143088798, "loss": 0.019, "step": 49280 }, { "epoch": 0.53, "learning_rate": 0.00022007199844327688, "loss": 0.0155, "step": 49290 }, { "epoch": 0.53, "learning_rate": 0.000220055782577674, "loss": 0.0196, "step": 49300 }, { "epoch": 0.53, "learning_rate": 0.00022003956671207107, "loss": 0.0227, "step": 49310 }, { "epoch": 0.53, "learning_rate": 0.00022002335084646816, "loss": 0.0186, "step": 49320 }, { "epoch": 0.53, "learning_rate": 0.00022000713498086525, "loss": 0.0188, "step": 49330 }, { "epoch": 0.53, "learning_rate": 0.00021999091911526237, "loss": 0.0201, "step": 49340 }, { "epoch": 0.53, "learning_rate": 0.00021997470324965944, "loss": 0.0178, "step": 49350 }, { "epoch": 0.53, "learning_rate": 0.00021995848738405653, "loss": 0.0241, "step": 49360 }, { "epoch": 0.53, "learning_rate": 0.00021994227151845365, "loss": 0.0227, "step": 49370 }, { "epoch": 0.53, "learning_rate": 0.00021992605565285074, "loss": 0.0157, "step": 49380 }, { "epoch": 0.53, "learning_rate": 0.0002199098397872478, "loss": 0.0149, "step": 49390 }, { "epoch": 0.53, "learning_rate": 0.0002198936239216449, "loss": 0.017, "step": 49400 }, { "epoch": 0.53, "learning_rate": 0.00021987740805604202, "loss": 0.0238, "step": 49410 }, { "epoch": 0.53, "learning_rate": 0.00021986119219043912, "loss": 0.0172, "step": 49420 }, { "epoch": 0.53, "learning_rate": 0.00021984497632483618, "loss": 0.0191, "step": 49430 }, { "epoch": 0.53, "learning_rate": 0.0002198287604592333, "loss": 0.0171, "step": 49440 }, { "epoch": 0.53, "learning_rate": 0.0002198125445936304, "loss": 0.0158, "step": 49450 }, { "epoch": 0.53, "learning_rate": 0.00021979632872802749, "loss": 0.0169, "step": 49460 }, { "epoch": 0.53, "learning_rate": 0.00021978011286242455, "loss": 0.0189, "step": 49470 }, { "epoch": 0.53, "learning_rate": 0.00021976389699682167, "loss": 0.0164, "step": 49480 }, { "epoch": 0.54, "learning_rate": 0.00021974768113121876, "loss": 0.0204, "step": 49490 }, { "epoch": 0.54, "learning_rate": 0.00021973146526561586, "loss": 0.0191, "step": 49500 }, { "epoch": 0.54, "learning_rate": 0.00021971524940001295, "loss": 0.0214, "step": 49510 }, { "epoch": 0.54, "learning_rate": 0.00021969903353441004, "loss": 0.0211, "step": 49520 }, { "epoch": 0.54, "learning_rate": 0.00021968281766880714, "loss": 0.017, "step": 49530 }, { "epoch": 0.54, "learning_rate": 0.00021966660180320426, "loss": 0.02, "step": 49540 }, { "epoch": 0.54, "learning_rate": 0.00021965038593760132, "loss": 0.0175, "step": 49550 }, { "epoch": 0.54, "learning_rate": 0.00021963417007199841, "loss": 0.0213, "step": 49560 }, { "epoch": 0.54, "learning_rate": 0.0002196179542063955, "loss": 0.0212, "step": 49570 }, { "epoch": 0.54, "learning_rate": 0.00021960173834079263, "loss": 0.0168, "step": 49580 }, { "epoch": 0.54, "learning_rate": 0.0002195855224751897, "loss": 0.0204, "step": 49590 }, { "epoch": 0.54, "learning_rate": 0.00021956930660958678, "loss": 0.0174, "step": 49600 }, { "epoch": 0.54, "learning_rate": 0.0002195530907439839, "loss": 0.017, "step": 49610 }, { "epoch": 0.54, "learning_rate": 0.000219536874878381, "loss": 0.0193, "step": 49620 }, { "epoch": 0.54, "learning_rate": 0.00021952065901277806, "loss": 0.0178, "step": 49630 }, { "epoch": 0.54, "learning_rate": 0.00021950444314717516, "loss": 0.0185, "step": 49640 }, { "epoch": 0.54, "learning_rate": 0.00021948822728157228, "loss": 0.0172, "step": 49650 }, { "epoch": 0.54, "learning_rate": 0.00021947201141596937, "loss": 0.0166, "step": 49660 }, { "epoch": 0.54, "learning_rate": 0.0002194557955503665, "loss": 0.019, "step": 49670 }, { "epoch": 0.54, "learning_rate": 0.00021943957968476355, "loss": 0.0192, "step": 49680 }, { "epoch": 0.54, "learning_rate": 0.00021942336381916065, "loss": 0.0197, "step": 49690 }, { "epoch": 0.54, "learning_rate": 0.00021940714795355774, "loss": 0.0171, "step": 49700 }, { "epoch": 0.54, "learning_rate": 0.00021939093208795486, "loss": 0.017, "step": 49710 }, { "epoch": 0.54, "learning_rate": 0.00021937471622235192, "loss": 0.0172, "step": 49720 }, { "epoch": 0.54, "learning_rate": 0.00021935850035674902, "loss": 0.0178, "step": 49730 }, { "epoch": 0.54, "learning_rate": 0.00021934228449114614, "loss": 0.0167, "step": 49740 }, { "epoch": 0.54, "learning_rate": 0.00021932606862554323, "loss": 0.0191, "step": 49750 }, { "epoch": 0.54, "learning_rate": 0.0002193098527599403, "loss": 0.0176, "step": 49760 }, { "epoch": 0.54, "learning_rate": 0.0002192936368943374, "loss": 0.0168, "step": 49770 }, { "epoch": 0.54, "learning_rate": 0.0002192774210287345, "loss": 0.0167, "step": 49780 }, { "epoch": 0.54, "learning_rate": 0.0002192612051631316, "loss": 0.0189, "step": 49790 }, { "epoch": 0.54, "learning_rate": 0.00021924498929752867, "loss": 0.017, "step": 49800 }, { "epoch": 0.54, "learning_rate": 0.00021922877343192579, "loss": 0.0153, "step": 49810 }, { "epoch": 0.54, "learning_rate": 0.00021921255756632288, "loss": 0.0171, "step": 49820 }, { "epoch": 0.54, "learning_rate": 0.00021919634170071997, "loss": 0.0226, "step": 49830 }, { "epoch": 0.54, "learning_rate": 0.00021918012583511704, "loss": 0.0217, "step": 49840 }, { "epoch": 0.54, "learning_rate": 0.00021916390996951416, "loss": 0.0209, "step": 49850 }, { "epoch": 0.54, "learning_rate": 0.00021914769410391125, "loss": 0.0174, "step": 49860 }, { "epoch": 0.54, "learning_rate": 0.00021913147823830834, "loss": 0.016, "step": 49870 }, { "epoch": 0.54, "learning_rate": 0.00021911526237270544, "loss": 0.0164, "step": 49880 }, { "epoch": 0.54, "learning_rate": 0.00021909904650710253, "loss": 0.0161, "step": 49890 }, { "epoch": 0.54, "learning_rate": 0.00021908283064149962, "loss": 0.0161, "step": 49900 }, { "epoch": 0.54, "learning_rate": 0.00021906661477589674, "loss": 0.0174, "step": 49910 }, { "epoch": 0.54, "learning_rate": 0.0002190503989102938, "loss": 0.0155, "step": 49920 }, { "epoch": 0.54, "learning_rate": 0.0002190341830446909, "loss": 0.0178, "step": 49930 }, { "epoch": 0.54, "learning_rate": 0.000219017967179088, "loss": 0.0185, "step": 49940 }, { "epoch": 0.54, "learning_rate": 0.0002190017513134851, "loss": 0.0155, "step": 49950 }, { "epoch": 0.54, "learning_rate": 0.00021898553544788218, "loss": 0.0171, "step": 49960 }, { "epoch": 0.54, "learning_rate": 0.00021896931958227927, "loss": 0.0163, "step": 49970 }, { "epoch": 0.54, "learning_rate": 0.0002189531037166764, "loss": 0.0167, "step": 49980 }, { "epoch": 0.54, "learning_rate": 0.00021893688785107348, "loss": 0.0218, "step": 49990 }, { "epoch": 0.54, "learning_rate": 0.00021892067198547055, "loss": 0.0191, "step": 50000 }, { "epoch": 0.54, "eval_cer": 0.9215842623041952, "eval_loss": 0.012915155850350857, "eval_runtime": 121.4472, "eval_samples_per_second": 16.468, "eval_steps_per_second": 4.117, "step": 50000 }, { "epoch": 0.54, "learning_rate": 0.00021890445611986767, "loss": 0.0204, "step": 50010 }, { "epoch": 0.54, "learning_rate": 0.00021888824025426476, "loss": 0.0174, "step": 50020 }, { "epoch": 0.54, "learning_rate": 0.00021887202438866185, "loss": 0.0203, "step": 50030 }, { "epoch": 0.54, "learning_rate": 0.00021885580852305892, "loss": 0.0191, "step": 50040 }, { "epoch": 0.54, "learning_rate": 0.00021883959265745604, "loss": 0.0184, "step": 50050 }, { "epoch": 0.54, "learning_rate": 0.00021882337679185313, "loss": 0.016, "step": 50060 }, { "epoch": 0.54, "learning_rate": 0.00021880716092625022, "loss": 0.0182, "step": 50070 }, { "epoch": 0.54, "learning_rate": 0.00021879094506064732, "loss": 0.0141, "step": 50080 }, { "epoch": 0.54, "learning_rate": 0.0002187747291950444, "loss": 0.0184, "step": 50090 }, { "epoch": 0.54, "learning_rate": 0.0002187585133294415, "loss": 0.0171, "step": 50100 }, { "epoch": 0.54, "learning_rate": 0.00021874229746383862, "loss": 0.0196, "step": 50110 }, { "epoch": 0.54, "learning_rate": 0.0002187260815982357, "loss": 0.0165, "step": 50120 }, { "epoch": 0.54, "learning_rate": 0.00021870986573263278, "loss": 0.0215, "step": 50130 }, { "epoch": 0.54, "learning_rate": 0.00021869364986702987, "loss": 0.0177, "step": 50140 }, { "epoch": 0.54, "learning_rate": 0.000218677434001427, "loss": 0.0229, "step": 50150 }, { "epoch": 0.54, "learning_rate": 0.00021866121813582406, "loss": 0.0169, "step": 50160 }, { "epoch": 0.54, "learning_rate": 0.00021864500227022115, "loss": 0.0163, "step": 50170 }, { "epoch": 0.54, "learning_rate": 0.00021862878640461827, "loss": 0.0187, "step": 50180 }, { "epoch": 0.54, "learning_rate": 0.00021861257053901536, "loss": 0.0169, "step": 50190 }, { "epoch": 0.54, "learning_rate": 0.00021859635467341243, "loss": 0.0178, "step": 50200 }, { "epoch": 0.54, "learning_rate": 0.00021858013880780952, "loss": 0.0177, "step": 50210 }, { "epoch": 0.54, "learning_rate": 0.00021856392294220664, "loss": 0.0155, "step": 50220 }, { "epoch": 0.54, "learning_rate": 0.00021854770707660374, "loss": 0.0144, "step": 50230 }, { "epoch": 0.54, "learning_rate": 0.0002185314912110008, "loss": 0.0227, "step": 50240 }, { "epoch": 0.54, "learning_rate": 0.00021851527534539792, "loss": 0.0183, "step": 50250 }, { "epoch": 0.54, "learning_rate": 0.00021849905947979501, "loss": 0.0161, "step": 50260 }, { "epoch": 0.54, "learning_rate": 0.0002184828436141921, "loss": 0.0199, "step": 50270 }, { "epoch": 0.54, "learning_rate": 0.00021846662774858917, "loss": 0.016, "step": 50280 }, { "epoch": 0.54, "learning_rate": 0.0002184504118829863, "loss": 0.016, "step": 50290 }, { "epoch": 0.54, "learning_rate": 0.00021843419601738339, "loss": 0.0188, "step": 50300 }, { "epoch": 0.54, "learning_rate": 0.0002184179801517805, "loss": 0.0154, "step": 50310 }, { "epoch": 0.54, "learning_rate": 0.00021840176428617757, "loss": 0.0222, "step": 50320 }, { "epoch": 0.54, "learning_rate": 0.00021838554842057466, "loss": 0.0194, "step": 50330 }, { "epoch": 0.54, "learning_rate": 0.00021836933255497176, "loss": 0.0159, "step": 50340 }, { "epoch": 0.54, "learning_rate": 0.00021835311668936888, "loss": 0.0183, "step": 50350 }, { "epoch": 0.54, "learning_rate": 0.00021833690082376597, "loss": 0.0167, "step": 50360 }, { "epoch": 0.54, "learning_rate": 0.00021832068495816303, "loss": 0.0178, "step": 50370 }, { "epoch": 0.54, "learning_rate": 0.00021830446909256015, "loss": 0.0144, "step": 50380 }, { "epoch": 0.54, "learning_rate": 0.00021828825322695725, "loss": 0.0199, "step": 50390 }, { "epoch": 0.54, "learning_rate": 0.00021827203736135434, "loss": 0.0172, "step": 50400 }, { "epoch": 0.54, "learning_rate": 0.0002182558214957514, "loss": 0.0214, "step": 50410 }, { "epoch": 0.55, "learning_rate": 0.00021823960563014853, "loss": 0.0189, "step": 50420 }, { "epoch": 0.55, "learning_rate": 0.00021822338976454562, "loss": 0.0173, "step": 50430 }, { "epoch": 0.55, "learning_rate": 0.0002182071738989427, "loss": 0.0194, "step": 50440 }, { "epoch": 0.55, "learning_rate": 0.0002181909580333398, "loss": 0.0166, "step": 50450 }, { "epoch": 0.55, "learning_rate": 0.0002181747421677369, "loss": 0.0183, "step": 50460 }, { "epoch": 0.55, "learning_rate": 0.000218158526302134, "loss": 0.0171, "step": 50470 }, { "epoch": 0.55, "learning_rate": 0.0002181423104365311, "loss": 0.0211, "step": 50480 }, { "epoch": 0.55, "learning_rate": 0.00021812609457092817, "loss": 0.0205, "step": 50490 }, { "epoch": 0.55, "learning_rate": 0.00021810987870532527, "loss": 0.0207, "step": 50500 }, { "epoch": 0.55, "learning_rate": 0.00021809366283972236, "loss": 0.0188, "step": 50510 }, { "epoch": 0.55, "learning_rate": 0.00021807744697411948, "loss": 0.0188, "step": 50520 }, { "epoch": 0.55, "learning_rate": 0.00021806123110851655, "loss": 0.0175, "step": 50530 }, { "epoch": 0.55, "learning_rate": 0.00021804501524291364, "loss": 0.0212, "step": 50540 }, { "epoch": 0.55, "learning_rate": 0.00021802879937731076, "loss": 0.0153, "step": 50550 }, { "epoch": 0.55, "learning_rate": 0.00021801258351170785, "loss": 0.021, "step": 50560 }, { "epoch": 0.55, "learning_rate": 0.00021799636764610492, "loss": 0.0177, "step": 50570 }, { "epoch": 0.55, "learning_rate": 0.000217980151780502, "loss": 0.0155, "step": 50580 }, { "epoch": 0.55, "learning_rate": 0.00021796393591489913, "loss": 0.0162, "step": 50590 }, { "epoch": 0.55, "learning_rate": 0.00021794772004929622, "loss": 0.0197, "step": 50600 }, { "epoch": 0.55, "learning_rate": 0.0002179315041836933, "loss": 0.0168, "step": 50610 }, { "epoch": 0.55, "learning_rate": 0.0002179152883180904, "loss": 0.0175, "step": 50620 }, { "epoch": 0.55, "learning_rate": 0.0002178990724524875, "loss": 0.0186, "step": 50630 }, { "epoch": 0.55, "learning_rate": 0.0002178828565868846, "loss": 0.0174, "step": 50640 }, { "epoch": 0.55, "learning_rate": 0.00021786664072128166, "loss": 0.0211, "step": 50650 }, { "epoch": 0.55, "learning_rate": 0.00021785042485567878, "loss": 0.0176, "step": 50660 }, { "epoch": 0.55, "learning_rate": 0.00021783420899007587, "loss": 0.0202, "step": 50670 }, { "epoch": 0.55, "learning_rate": 0.000217817993124473, "loss": 0.0184, "step": 50680 }, { "epoch": 0.55, "learning_rate": 0.00021780177725887006, "loss": 0.0174, "step": 50690 }, { "epoch": 0.55, "learning_rate": 0.00021778556139326715, "loss": 0.0181, "step": 50700 }, { "epoch": 0.55, "learning_rate": 0.00021776934552766424, "loss": 0.0168, "step": 50710 }, { "epoch": 0.55, "learning_rate": 0.00021775312966206136, "loss": 0.0176, "step": 50720 }, { "epoch": 0.55, "learning_rate": 0.00021773691379645843, "loss": 0.0166, "step": 50730 }, { "epoch": 0.55, "learning_rate": 0.00021772069793085552, "loss": 0.0215, "step": 50740 }, { "epoch": 0.55, "learning_rate": 0.00021770448206525264, "loss": 0.0183, "step": 50750 }, { "epoch": 0.55, "learning_rate": 0.00021768826619964973, "loss": 0.0198, "step": 50760 }, { "epoch": 0.55, "learning_rate": 0.0002176720503340468, "loss": 0.0157, "step": 50770 }, { "epoch": 0.55, "learning_rate": 0.0002176558344684439, "loss": 0.0192, "step": 50780 }, { "epoch": 0.55, "learning_rate": 0.000217639618602841, "loss": 0.0194, "step": 50790 }, { "epoch": 0.55, "learning_rate": 0.0002176234027372381, "loss": 0.0168, "step": 50800 }, { "epoch": 0.55, "learning_rate": 0.00021760718687163517, "loss": 0.0196, "step": 50810 }, { "epoch": 0.55, "learning_rate": 0.0002175909710060323, "loss": 0.0191, "step": 50820 }, { "epoch": 0.55, "learning_rate": 0.00021757475514042938, "loss": 0.0192, "step": 50830 }, { "epoch": 0.55, "learning_rate": 0.00021755853927482647, "loss": 0.0203, "step": 50840 }, { "epoch": 0.55, "learning_rate": 0.00021754232340922354, "loss": 0.0162, "step": 50850 }, { "epoch": 0.55, "learning_rate": 0.00021752610754362066, "loss": 0.0187, "step": 50860 }, { "epoch": 0.55, "learning_rate": 0.00021750989167801775, "loss": 0.0172, "step": 50870 }, { "epoch": 0.55, "learning_rate": 0.00021749367581241485, "loss": 0.0181, "step": 50880 }, { "epoch": 0.55, "learning_rate": 0.00021747745994681194, "loss": 0.0176, "step": 50890 }, { "epoch": 0.55, "learning_rate": 0.00021746124408120903, "loss": 0.0166, "step": 50900 }, { "epoch": 0.55, "learning_rate": 0.00021744502821560612, "loss": 0.019, "step": 50910 }, { "epoch": 0.55, "learning_rate": 0.00021742881235000324, "loss": 0.0197, "step": 50920 }, { "epoch": 0.55, "learning_rate": 0.0002174125964844003, "loss": 0.015, "step": 50930 }, { "epoch": 0.55, "learning_rate": 0.0002173963806187974, "loss": 0.0164, "step": 50940 }, { "epoch": 0.55, "learning_rate": 0.0002173801647531945, "loss": 0.0161, "step": 50950 }, { "epoch": 0.55, "learning_rate": 0.00021736394888759161, "loss": 0.0182, "step": 50960 }, { "epoch": 0.55, "learning_rate": 0.00021734773302198868, "loss": 0.0151, "step": 50970 }, { "epoch": 0.55, "learning_rate": 0.00021733151715638577, "loss": 0.0166, "step": 50980 }, { "epoch": 0.55, "learning_rate": 0.0002173153012907829, "loss": 0.0201, "step": 50990 }, { "epoch": 0.55, "learning_rate": 0.00021729908542517999, "loss": 0.017, "step": 51000 }, { "epoch": 0.55, "eval_cer": 0.921579050686457, "eval_loss": 0.012746312655508518, "eval_runtime": 121.6627, "eval_samples_per_second": 16.439, "eval_steps_per_second": 4.11, "step": 51000 }, { "epoch": 0.55, "learning_rate": 0.00021728286955957705, "loss": 0.0226, "step": 51010 }, { "epoch": 0.55, "learning_rate": 0.00021726665369397417, "loss": 0.0193, "step": 51020 }, { "epoch": 0.55, "learning_rate": 0.00021725043782837126, "loss": 0.0194, "step": 51030 }, { "epoch": 0.55, "learning_rate": 0.00021723422196276836, "loss": 0.0167, "step": 51040 }, { "epoch": 0.55, "learning_rate": 0.00021721800609716542, "loss": 0.0164, "step": 51050 }, { "epoch": 0.55, "learning_rate": 0.00021720179023156254, "loss": 0.0173, "step": 51060 }, { "epoch": 0.55, "learning_rate": 0.00021718557436595963, "loss": 0.0186, "step": 51070 }, { "epoch": 0.55, "learning_rate": 0.00021716935850035673, "loss": 0.0221, "step": 51080 }, { "epoch": 0.55, "learning_rate": 0.00021715314263475385, "loss": 0.0229, "step": 51090 }, { "epoch": 0.55, "learning_rate": 0.0002171369267691509, "loss": 0.0208, "step": 51100 }, { "epoch": 0.55, "learning_rate": 0.000217120710903548, "loss": 0.017, "step": 51110 }, { "epoch": 0.55, "learning_rate": 0.00021710449503794513, "loss": 0.0177, "step": 51120 }, { "epoch": 0.55, "learning_rate": 0.00021708827917234222, "loss": 0.0165, "step": 51130 }, { "epoch": 0.55, "learning_rate": 0.00021707206330673928, "loss": 0.0159, "step": 51140 }, { "epoch": 0.55, "learning_rate": 0.00021705584744113638, "loss": 0.0208, "step": 51150 }, { "epoch": 0.55, "learning_rate": 0.0002170396315755335, "loss": 0.0175, "step": 51160 }, { "epoch": 0.55, "learning_rate": 0.0002170234157099306, "loss": 0.0155, "step": 51170 }, { "epoch": 0.55, "learning_rate": 0.00021700719984432765, "loss": 0.018, "step": 51180 }, { "epoch": 0.55, "learning_rate": 0.00021699098397872477, "loss": 0.0177, "step": 51190 }, { "epoch": 0.55, "learning_rate": 0.00021697476811312187, "loss": 0.022, "step": 51200 }, { "epoch": 0.55, "learning_rate": 0.00021695855224751896, "loss": 0.0152, "step": 51210 }, { "epoch": 0.55, "learning_rate": 0.00021694233638191603, "loss": 0.0151, "step": 51220 }, { "epoch": 0.55, "learning_rate": 0.00021692612051631315, "loss": 0.0176, "step": 51230 }, { "epoch": 0.55, "learning_rate": 0.00021690990465071024, "loss": 0.0147, "step": 51240 }, { "epoch": 0.55, "learning_rate": 0.00021689368878510733, "loss": 0.0166, "step": 51250 }, { "epoch": 0.55, "learning_rate": 0.00021687747291950442, "loss": 0.0183, "step": 51260 }, { "epoch": 0.55, "learning_rate": 0.00021686125705390152, "loss": 0.02, "step": 51270 }, { "epoch": 0.55, "learning_rate": 0.0002168450411882986, "loss": 0.0192, "step": 51280 }, { "epoch": 0.55, "learning_rate": 0.00021682882532269573, "loss": 0.0202, "step": 51290 }, { "epoch": 0.55, "learning_rate": 0.0002168126094570928, "loss": 0.015, "step": 51300 }, { "epoch": 0.55, "learning_rate": 0.0002167963935914899, "loss": 0.0151, "step": 51310 }, { "epoch": 0.55, "learning_rate": 0.000216780177725887, "loss": 0.0178, "step": 51320 }, { "epoch": 0.55, "learning_rate": 0.0002167639618602841, "loss": 0.0185, "step": 51330 }, { "epoch": 0.56, "learning_rate": 0.00021674774599468117, "loss": 0.0198, "step": 51340 }, { "epoch": 0.56, "learning_rate": 0.00021673153012907826, "loss": 0.0171, "step": 51350 }, { "epoch": 0.56, "learning_rate": 0.00021671531426347538, "loss": 0.0182, "step": 51360 }, { "epoch": 0.56, "learning_rate": 0.00021669909839787247, "loss": 0.0169, "step": 51370 }, { "epoch": 0.56, "learning_rate": 0.00021668288253226954, "loss": 0.0173, "step": 51380 }, { "epoch": 0.56, "learning_rate": 0.00021666666666666666, "loss": 0.0155, "step": 51390 }, { "epoch": 0.56, "learning_rate": 0.00021665045080106375, "loss": 0.0168, "step": 51400 }, { "epoch": 0.56, "learning_rate": 0.00021663423493546084, "loss": 0.0177, "step": 51410 }, { "epoch": 0.56, "learning_rate": 0.0002166180190698579, "loss": 0.0219, "step": 51420 }, { "epoch": 0.56, "learning_rate": 0.00021660180320425503, "loss": 0.0199, "step": 51430 }, { "epoch": 0.56, "learning_rate": 0.00021658558733865212, "loss": 0.0171, "step": 51440 }, { "epoch": 0.56, "learning_rate": 0.0002165693714730492, "loss": 0.0192, "step": 51450 }, { "epoch": 0.56, "learning_rate": 0.0002165531556074463, "loss": 0.0174, "step": 51460 }, { "epoch": 0.56, "learning_rate": 0.0002165369397418434, "loss": 0.0175, "step": 51470 }, { "epoch": 0.56, "learning_rate": 0.0002165207238762405, "loss": 0.0185, "step": 51480 }, { "epoch": 0.56, "learning_rate": 0.0002165045080106376, "loss": 0.0147, "step": 51490 }, { "epoch": 0.56, "learning_rate": 0.00021648829214503468, "loss": 0.0194, "step": 51500 }, { "epoch": 0.56, "learning_rate": 0.00021647207627943177, "loss": 0.0168, "step": 51510 }, { "epoch": 0.56, "learning_rate": 0.00021645586041382886, "loss": 0.015, "step": 51520 }, { "epoch": 0.56, "learning_rate": 0.00021643964454822598, "loss": 0.0157, "step": 51530 }, { "epoch": 0.56, "learning_rate": 0.00021642342868262305, "loss": 0.0185, "step": 51540 }, { "epoch": 0.56, "learning_rate": 0.00021640721281702014, "loss": 0.0169, "step": 51550 }, { "epoch": 0.56, "learning_rate": 0.00021639099695141726, "loss": 0.0211, "step": 51560 }, { "epoch": 0.56, "learning_rate": 0.00021637478108581435, "loss": 0.019, "step": 51570 }, { "epoch": 0.56, "learning_rate": 0.00021635856522021142, "loss": 0.0183, "step": 51580 }, { "epoch": 0.56, "learning_rate": 0.0002163423493546085, "loss": 0.0171, "step": 51590 }, { "epoch": 0.56, "learning_rate": 0.00021632613348900563, "loss": 0.0155, "step": 51600 }, { "epoch": 0.56, "learning_rate": 0.00021630991762340272, "loss": 0.0195, "step": 51610 }, { "epoch": 0.56, "learning_rate": 0.0002162937017577998, "loss": 0.0184, "step": 51620 }, { "epoch": 0.56, "learning_rate": 0.0002162774858921969, "loss": 0.021, "step": 51630 }, { "epoch": 0.56, "learning_rate": 0.000216261270026594, "loss": 0.0163, "step": 51640 }, { "epoch": 0.56, "learning_rate": 0.0002162450541609911, "loss": 0.022, "step": 51650 }, { "epoch": 0.56, "learning_rate": 0.00021622883829538816, "loss": 0.0176, "step": 51660 }, { "epoch": 0.56, "learning_rate": 0.00021621262242978528, "loss": 0.0198, "step": 51670 }, { "epoch": 0.56, "learning_rate": 0.00021619640656418237, "loss": 0.0169, "step": 51680 }, { "epoch": 0.56, "learning_rate": 0.0002161801906985795, "loss": 0.0197, "step": 51690 }, { "epoch": 0.56, "learning_rate": 0.00021616397483297656, "loss": 0.0156, "step": 51700 }, { "epoch": 0.56, "learning_rate": 0.00021614775896737365, "loss": 0.0193, "step": 51710 }, { "epoch": 0.56, "learning_rate": 0.00021613154310177074, "loss": 0.015, "step": 51720 }, { "epoch": 0.56, "learning_rate": 0.00021611532723616786, "loss": 0.0154, "step": 51730 }, { "epoch": 0.56, "learning_rate": 0.00021609911137056493, "loss": 0.0174, "step": 51740 }, { "epoch": 0.56, "learning_rate": 0.00021608289550496202, "loss": 0.0193, "step": 51750 }, { "epoch": 0.56, "learning_rate": 0.00021606667963935914, "loss": 0.0192, "step": 51760 }, { "epoch": 0.56, "learning_rate": 0.00021605046377375624, "loss": 0.0211, "step": 51770 }, { "epoch": 0.56, "learning_rate": 0.0002160342479081533, "loss": 0.0146, "step": 51780 }, { "epoch": 0.56, "learning_rate": 0.0002160180320425504, "loss": 0.0188, "step": 51790 }, { "epoch": 0.56, "learning_rate": 0.0002160018161769475, "loss": 0.0145, "step": 51800 }, { "epoch": 0.56, "learning_rate": 0.0002159856003113446, "loss": 0.0165, "step": 51810 }, { "epoch": 0.56, "learning_rate": 0.0002159693844457417, "loss": 0.0174, "step": 51820 }, { "epoch": 0.56, "learning_rate": 0.0002159531685801388, "loss": 0.0205, "step": 51830 }, { "epoch": 0.56, "learning_rate": 0.00021593695271453588, "loss": 0.0159, "step": 51840 }, { "epoch": 0.56, "learning_rate": 0.00021592073684893298, "loss": 0.0198, "step": 51850 }, { "epoch": 0.56, "learning_rate": 0.0002159045209833301, "loss": 0.0198, "step": 51860 }, { "epoch": 0.56, "learning_rate": 0.00021588830511772716, "loss": 0.016, "step": 51870 }, { "epoch": 0.56, "learning_rate": 0.00021587208925212426, "loss": 0.0207, "step": 51880 }, { "epoch": 0.56, "learning_rate": 0.00021585587338652135, "loss": 0.0166, "step": 51890 }, { "epoch": 0.56, "learning_rate": 0.00021583965752091847, "loss": 0.0183, "step": 51900 }, { "epoch": 0.56, "learning_rate": 0.00021582344165531553, "loss": 0.0172, "step": 51910 }, { "epoch": 0.56, "learning_rate": 0.00021580722578971263, "loss": 0.0159, "step": 51920 }, { "epoch": 0.56, "learning_rate": 0.00021579100992410975, "loss": 0.0147, "step": 51930 }, { "epoch": 0.56, "learning_rate": 0.00021577479405850684, "loss": 0.0162, "step": 51940 }, { "epoch": 0.56, "learning_rate": 0.0002157585781929039, "loss": 0.0153, "step": 51950 }, { "epoch": 0.56, "learning_rate": 0.000215742362327301, "loss": 0.0173, "step": 51960 }, { "epoch": 0.56, "learning_rate": 0.00021572614646169812, "loss": 0.0166, "step": 51970 }, { "epoch": 0.56, "learning_rate": 0.0002157099305960952, "loss": 0.021, "step": 51980 }, { "epoch": 0.56, "learning_rate": 0.00021569371473049228, "loss": 0.0174, "step": 51990 }, { "epoch": 0.56, "learning_rate": 0.0002156774988648894, "loss": 0.0188, "step": 52000 }, { "epoch": 0.56, "eval_cer": 0.9215338833327253, "eval_loss": 0.01269690040498972, "eval_runtime": 121.7858, "eval_samples_per_second": 16.422, "eval_steps_per_second": 4.106, "step": 52000 }, { "epoch": 0.56, "learning_rate": 0.0002156612829992865, "loss": 0.0184, "step": 52010 }, { "epoch": 0.56, "learning_rate": 0.00021564506713368358, "loss": 0.0176, "step": 52020 }, { "epoch": 0.56, "learning_rate": 0.00021562885126808067, "loss": 0.0194, "step": 52030 }, { "epoch": 0.56, "learning_rate": 0.00021561263540247777, "loss": 0.0167, "step": 52040 }, { "epoch": 0.56, "learning_rate": 0.00021559641953687486, "loss": 0.0171, "step": 52050 }, { "epoch": 0.56, "learning_rate": 0.00021558020367127198, "loss": 0.0203, "step": 52060 }, { "epoch": 0.56, "learning_rate": 0.00021556398780566904, "loss": 0.0203, "step": 52070 }, { "epoch": 0.56, "learning_rate": 0.00021554777194006614, "loss": 0.0205, "step": 52080 }, { "epoch": 0.56, "learning_rate": 0.00021553155607446323, "loss": 0.0186, "step": 52090 }, { "epoch": 0.56, "learning_rate": 0.00021551534020886035, "loss": 0.0261, "step": 52100 }, { "epoch": 0.56, "learning_rate": 0.00021549912434325742, "loss": 0.0154, "step": 52110 }, { "epoch": 0.56, "learning_rate": 0.0002154829084776545, "loss": 0.0199, "step": 52120 }, { "epoch": 0.56, "learning_rate": 0.00021546669261205163, "loss": 0.0178, "step": 52130 }, { "epoch": 0.56, "learning_rate": 0.00021545047674644872, "loss": 0.0346, "step": 52140 }, { "epoch": 0.56, "learning_rate": 0.0002154342608808458, "loss": 0.0188, "step": 52150 }, { "epoch": 0.56, "learning_rate": 0.00021541804501524288, "loss": 0.0178, "step": 52160 }, { "epoch": 0.56, "learning_rate": 0.00021540182914964, "loss": 0.017, "step": 52170 }, { "epoch": 0.56, "learning_rate": 0.0002153856132840371, "loss": 0.022, "step": 52180 }, { "epoch": 0.56, "learning_rate": 0.00021536939741843416, "loss": 0.0169, "step": 52190 }, { "epoch": 0.56, "learning_rate": 0.00021535318155283128, "loss": 0.0167, "step": 52200 }, { "epoch": 0.56, "learning_rate": 0.00021533696568722837, "loss": 0.0176, "step": 52210 }, { "epoch": 0.56, "learning_rate": 0.00021532074982162546, "loss": 0.0163, "step": 52220 }, { "epoch": 0.56, "learning_rate": 0.00021530453395602253, "loss": 0.0206, "step": 52230 }, { "epoch": 0.56, "learning_rate": 0.00021528831809041965, "loss": 0.0177, "step": 52240 }, { "epoch": 0.56, "learning_rate": 0.00021527210222481674, "loss": 0.0202, "step": 52250 }, { "epoch": 0.56, "learning_rate": 0.00021525588635921383, "loss": 0.0181, "step": 52260 }, { "epoch": 0.57, "learning_rate": 0.00021523967049361093, "loss": 0.0167, "step": 52270 }, { "epoch": 0.57, "learning_rate": 0.00021522345462800802, "loss": 0.0154, "step": 52280 }, { "epoch": 0.57, "learning_rate": 0.0002152072387624051, "loss": 0.0166, "step": 52290 }, { "epoch": 0.57, "learning_rate": 0.00021519102289680223, "loss": 0.0156, "step": 52300 }, { "epoch": 0.57, "learning_rate": 0.0002151748070311993, "loss": 0.0164, "step": 52310 }, { "epoch": 0.57, "learning_rate": 0.0002151585911655964, "loss": 0.0206, "step": 52320 }, { "epoch": 0.57, "learning_rate": 0.0002151423752999935, "loss": 0.0172, "step": 52330 }, { "epoch": 0.57, "learning_rate": 0.0002151261594343906, "loss": 0.0189, "step": 52340 }, { "epoch": 0.57, "learning_rate": 0.00021510994356878767, "loss": 0.016, "step": 52350 }, { "epoch": 0.57, "learning_rate": 0.00021509372770318476, "loss": 0.0159, "step": 52360 }, { "epoch": 0.57, "learning_rate": 0.00021507751183758188, "loss": 0.0205, "step": 52370 }, { "epoch": 0.57, "learning_rate": 0.00021506129597197897, "loss": 0.0155, "step": 52380 }, { "epoch": 0.57, "learning_rate": 0.00021504508010637604, "loss": 0.0423, "step": 52390 }, { "epoch": 0.57, "learning_rate": 0.00021502886424077316, "loss": 0.0137, "step": 52400 }, { "epoch": 0.57, "learning_rate": 0.00021501264837517025, "loss": 0.0178, "step": 52410 }, { "epoch": 0.57, "learning_rate": 0.00021499643250956734, "loss": 0.0164, "step": 52420 }, { "epoch": 0.57, "learning_rate": 0.0002149802166439644, "loss": 0.0183, "step": 52430 }, { "epoch": 0.57, "learning_rate": 0.00021496400077836153, "loss": 0.0189, "step": 52440 }, { "epoch": 0.57, "learning_rate": 0.00021494778491275862, "loss": 0.0196, "step": 52450 }, { "epoch": 0.57, "learning_rate": 0.00021493156904715572, "loss": 0.0183, "step": 52460 }, { "epoch": 0.57, "learning_rate": 0.0002149153531815528, "loss": 0.0152, "step": 52470 }, { "epoch": 0.57, "learning_rate": 0.0002148991373159499, "loss": 0.0175, "step": 52480 }, { "epoch": 0.57, "learning_rate": 0.000214882921450347, "loss": 0.0172, "step": 52490 }, { "epoch": 0.57, "learning_rate": 0.00021486670558474411, "loss": 0.0155, "step": 52500 }, { "epoch": 0.57, "learning_rate": 0.0002148504897191412, "loss": 0.0165, "step": 52510 }, { "epoch": 0.57, "learning_rate": 0.00021483427385353827, "loss": 0.0179, "step": 52520 }, { "epoch": 0.57, "learning_rate": 0.00021481805798793536, "loss": 0.017, "step": 52530 }, { "epoch": 0.57, "learning_rate": 0.00021480184212233248, "loss": 0.017, "step": 52540 }, { "epoch": 0.57, "learning_rate": 0.00021478562625672958, "loss": 0.0174, "step": 52550 }, { "epoch": 0.57, "learning_rate": 0.00021476941039112664, "loss": 0.0159, "step": 52560 }, { "epoch": 0.57, "learning_rate": 0.00021475319452552376, "loss": 0.0169, "step": 52570 }, { "epoch": 0.57, "learning_rate": 0.00021473697865992086, "loss": 0.0181, "step": 52580 }, { "epoch": 0.57, "learning_rate": 0.00021472076279431795, "loss": 0.0199, "step": 52590 }, { "epoch": 0.57, "learning_rate": 0.00021470454692871501, "loss": 0.014, "step": 52600 }, { "epoch": 0.57, "learning_rate": 0.00021468833106311213, "loss": 0.0227, "step": 52610 }, { "epoch": 0.57, "learning_rate": 0.00021467211519750923, "loss": 0.0188, "step": 52620 }, { "epoch": 0.57, "learning_rate": 0.00021465589933190635, "loss": 0.0149, "step": 52630 }, { "epoch": 0.57, "learning_rate": 0.0002146396834663034, "loss": 0.0178, "step": 52640 }, { "epoch": 0.57, "learning_rate": 0.0002146234676007005, "loss": 0.0188, "step": 52650 }, { "epoch": 0.57, "learning_rate": 0.0002146072517350976, "loss": 0.0178, "step": 52660 }, { "epoch": 0.57, "learning_rate": 0.00021459103586949472, "loss": 0.0158, "step": 52670 }, { "epoch": 0.57, "learning_rate": 0.00021457482000389178, "loss": 0.0199, "step": 52680 }, { "epoch": 0.57, "learning_rate": 0.00021455860413828888, "loss": 0.0143, "step": 52690 }, { "epoch": 0.57, "learning_rate": 0.000214542388272686, "loss": 0.018, "step": 52700 }, { "epoch": 0.57, "learning_rate": 0.0002145261724070831, "loss": 0.0189, "step": 52710 }, { "epoch": 0.57, "learning_rate": 0.00021450995654148015, "loss": 0.0154, "step": 52720 }, { "epoch": 0.57, "learning_rate": 0.00021449374067587725, "loss": 0.0158, "step": 52730 }, { "epoch": 0.57, "learning_rate": 0.00021447752481027437, "loss": 0.0167, "step": 52740 }, { "epoch": 0.57, "learning_rate": 0.00021446130894467146, "loss": 0.0196, "step": 52750 }, { "epoch": 0.57, "learning_rate": 0.00021444509307906853, "loss": 0.017, "step": 52760 }, { "epoch": 0.57, "learning_rate": 0.00021442887721346565, "loss": 0.019, "step": 52770 }, { "epoch": 0.57, "learning_rate": 0.00021441266134786274, "loss": 0.0194, "step": 52780 }, { "epoch": 0.57, "learning_rate": 0.00021439644548225983, "loss": 0.0196, "step": 52790 }, { "epoch": 0.57, "learning_rate": 0.0002143802296166569, "loss": 0.0162, "step": 52800 }, { "epoch": 0.57, "learning_rate": 0.00021436401375105402, "loss": 0.0165, "step": 52810 }, { "epoch": 0.57, "learning_rate": 0.0002143477978854511, "loss": 0.0162, "step": 52820 }, { "epoch": 0.57, "learning_rate": 0.0002143315820198482, "loss": 0.0159, "step": 52830 }, { "epoch": 0.57, "learning_rate": 0.0002143153661542453, "loss": 0.0183, "step": 52840 }, { "epoch": 0.57, "learning_rate": 0.0002142991502886424, "loss": 0.0198, "step": 52850 }, { "epoch": 0.57, "learning_rate": 0.00021428293442303948, "loss": 0.0165, "step": 52860 }, { "epoch": 0.57, "learning_rate": 0.0002142667185574366, "loss": 0.0185, "step": 52870 }, { "epoch": 0.57, "learning_rate": 0.00021425050269183367, "loss": 0.0188, "step": 52880 }, { "epoch": 0.57, "learning_rate": 0.00021423428682623076, "loss": 0.0185, "step": 52890 }, { "epoch": 0.57, "learning_rate": 0.00021421807096062785, "loss": 0.0185, "step": 52900 }, { "epoch": 0.57, "learning_rate": 0.00021420185509502497, "loss": 0.0202, "step": 52910 }, { "epoch": 0.57, "learning_rate": 0.00021418563922942204, "loss": 0.0205, "step": 52920 }, { "epoch": 0.57, "learning_rate": 0.00021416942336381913, "loss": 0.0177, "step": 52930 }, { "epoch": 0.57, "learning_rate": 0.00021415320749821625, "loss": 0.0171, "step": 52940 }, { "epoch": 0.57, "learning_rate": 0.00021413699163261334, "loss": 0.0167, "step": 52950 }, { "epoch": 0.57, "learning_rate": 0.0002141207757670104, "loss": 0.0176, "step": 52960 }, { "epoch": 0.57, "learning_rate": 0.0002141045599014075, "loss": 0.0201, "step": 52970 }, { "epoch": 0.57, "learning_rate": 0.00021408834403580462, "loss": 0.0173, "step": 52980 }, { "epoch": 0.57, "learning_rate": 0.0002140721281702017, "loss": 0.0164, "step": 52990 }, { "epoch": 0.57, "learning_rate": 0.00021405591230459878, "loss": 0.0157, "step": 53000 }, { "epoch": 0.57, "eval_cer": 0.9215582042155038, "eval_loss": 0.012771863490343094, "eval_runtime": 121.4029, "eval_samples_per_second": 16.474, "eval_steps_per_second": 4.119, "step": 53000 }, { "epoch": 0.57, "learning_rate": 0.0002140396964389959, "loss": 0.0192, "step": 53010 }, { "epoch": 0.57, "learning_rate": 0.000214023480573393, "loss": 0.0148, "step": 53020 }, { "epoch": 0.57, "learning_rate": 0.00021400726470779008, "loss": 0.0166, "step": 53030 }, { "epoch": 0.57, "learning_rate": 0.00021399104884218718, "loss": 0.0162, "step": 53040 }, { "epoch": 0.57, "learning_rate": 0.00021397483297658427, "loss": 0.0206, "step": 53050 }, { "epoch": 0.57, "learning_rate": 0.00021395861711098136, "loss": 0.0181, "step": 53060 }, { "epoch": 0.57, "learning_rate": 0.00021394240124537848, "loss": 0.0145, "step": 53070 }, { "epoch": 0.57, "learning_rate": 0.00021392618537977555, "loss": 0.0175, "step": 53080 }, { "epoch": 0.57, "learning_rate": 0.00021390996951417264, "loss": 0.0183, "step": 53090 }, { "epoch": 0.57, "learning_rate": 0.00021389375364856973, "loss": 0.0192, "step": 53100 }, { "epoch": 0.57, "learning_rate": 0.00021387753778296685, "loss": 0.0157, "step": 53110 }, { "epoch": 0.57, "learning_rate": 0.00021386132191736392, "loss": 0.02, "step": 53120 }, { "epoch": 0.57, "learning_rate": 0.000213845106051761, "loss": 0.0157, "step": 53130 }, { "epoch": 0.57, "learning_rate": 0.00021382889018615813, "loss": 0.0179, "step": 53140 }, { "epoch": 0.57, "learning_rate": 0.00021381267432055522, "loss": 0.0158, "step": 53150 }, { "epoch": 0.57, "learning_rate": 0.0002137964584549523, "loss": 0.0199, "step": 53160 }, { "epoch": 0.57, "learning_rate": 0.00021378024258934938, "loss": 0.0177, "step": 53170 }, { "epoch": 0.57, "learning_rate": 0.0002137640267237465, "loss": 0.0192, "step": 53180 }, { "epoch": 0.58, "learning_rate": 0.0002137478108581436, "loss": 0.0179, "step": 53190 }, { "epoch": 0.58, "learning_rate": 0.00021373159499254066, "loss": 0.015, "step": 53200 }, { "epoch": 0.58, "learning_rate": 0.00021371537912693778, "loss": 0.017, "step": 53210 }, { "epoch": 0.58, "learning_rate": 0.00021369916326133487, "loss": 0.0158, "step": 53220 }, { "epoch": 0.58, "learning_rate": 0.00021368294739573197, "loss": 0.0199, "step": 53230 }, { "epoch": 0.58, "learning_rate": 0.00021366673153012909, "loss": 0.0152, "step": 53240 }, { "epoch": 0.58, "learning_rate": 0.00021365051566452615, "loss": 0.0198, "step": 53250 }, { "epoch": 0.58, "learning_rate": 0.00021363429979892324, "loss": 0.0166, "step": 53260 }, { "epoch": 0.58, "learning_rate": 0.00021361808393332034, "loss": 0.0154, "step": 53270 }, { "epoch": 0.58, "learning_rate": 0.00021360186806771746, "loss": 0.0175, "step": 53280 }, { "epoch": 0.58, "learning_rate": 0.00021358565220211452, "loss": 0.0138, "step": 53290 }, { "epoch": 0.58, "learning_rate": 0.00021356943633651161, "loss": 0.0177, "step": 53300 }, { "epoch": 0.58, "learning_rate": 0.00021355322047090873, "loss": 0.0166, "step": 53310 }, { "epoch": 0.58, "learning_rate": 0.00021353700460530583, "loss": 0.0133, "step": 53320 }, { "epoch": 0.58, "learning_rate": 0.0002135207887397029, "loss": 0.0169, "step": 53330 }, { "epoch": 0.58, "learning_rate": 0.0002135045728741, "loss": 0.0176, "step": 53340 }, { "epoch": 0.58, "learning_rate": 0.0002134883570084971, "loss": 0.0216, "step": 53350 }, { "epoch": 0.58, "learning_rate": 0.0002134721411428942, "loss": 0.0189, "step": 53360 }, { "epoch": 0.58, "learning_rate": 0.00021345592527729126, "loss": 0.0146, "step": 53370 }, { "epoch": 0.58, "learning_rate": 0.00021343970941168838, "loss": 0.019, "step": 53380 }, { "epoch": 0.58, "learning_rate": 0.00021342349354608548, "loss": 0.0143, "step": 53390 }, { "epoch": 0.58, "learning_rate": 0.00021340727768048257, "loss": 0.0164, "step": 53400 }, { "epoch": 0.58, "learning_rate": 0.00021339106181487966, "loss": 0.0156, "step": 53410 }, { "epoch": 0.58, "learning_rate": 0.00021337484594927675, "loss": 0.0193, "step": 53420 }, { "epoch": 0.58, "learning_rate": 0.00021335863008367385, "loss": 0.0175, "step": 53430 }, { "epoch": 0.58, "learning_rate": 0.00021334241421807097, "loss": 0.0169, "step": 53440 }, { "epoch": 0.58, "learning_rate": 0.00021332619835246803, "loss": 0.0183, "step": 53450 }, { "epoch": 0.58, "learning_rate": 0.00021330998248686513, "loss": 0.0165, "step": 53460 }, { "epoch": 0.58, "learning_rate": 0.00021329376662126222, "loss": 0.0188, "step": 53470 }, { "epoch": 0.58, "learning_rate": 0.00021327755075565934, "loss": 0.0166, "step": 53480 }, { "epoch": 0.58, "learning_rate": 0.0002132613348900564, "loss": 0.0171, "step": 53490 }, { "epoch": 0.58, "learning_rate": 0.0002132451190244535, "loss": 0.0166, "step": 53500 }, { "epoch": 0.58, "learning_rate": 0.00021322890315885062, "loss": 0.017, "step": 53510 }, { "epoch": 0.58, "learning_rate": 0.0002132126872932477, "loss": 0.014, "step": 53520 }, { "epoch": 0.58, "learning_rate": 0.00021319647142764477, "loss": 0.0151, "step": 53530 }, { "epoch": 0.58, "learning_rate": 0.00021318025556204187, "loss": 0.0194, "step": 53540 }, { "epoch": 0.58, "learning_rate": 0.000213164039696439, "loss": 0.0151, "step": 53550 }, { "epoch": 0.58, "learning_rate": 0.00021314782383083608, "loss": 0.0189, "step": 53560 }, { "epoch": 0.58, "learning_rate": 0.00021313160796523315, "loss": 0.0189, "step": 53570 }, { "epoch": 0.58, "learning_rate": 0.00021311539209963027, "loss": 0.0173, "step": 53580 }, { "epoch": 0.58, "learning_rate": 0.00021309917623402736, "loss": 0.0192, "step": 53590 }, { "epoch": 0.58, "learning_rate": 0.00021308296036842445, "loss": 0.0159, "step": 53600 }, { "epoch": 0.58, "learning_rate": 0.00021306674450282152, "loss": 0.0161, "step": 53610 }, { "epoch": 0.58, "learning_rate": 0.00021305052863721864, "loss": 0.0152, "step": 53620 }, { "epoch": 0.58, "learning_rate": 0.00021303431277161573, "loss": 0.0172, "step": 53630 }, { "epoch": 0.58, "learning_rate": 0.00021301809690601285, "loss": 0.0155, "step": 53640 }, { "epoch": 0.58, "learning_rate": 0.00021300188104040991, "loss": 0.0178, "step": 53650 }, { "epoch": 0.58, "learning_rate": 0.000212985665174807, "loss": 0.0158, "step": 53660 }, { "epoch": 0.58, "learning_rate": 0.0002129694493092041, "loss": 0.0171, "step": 53670 }, { "epoch": 0.58, "learning_rate": 0.00021295323344360122, "loss": 0.0177, "step": 53680 }, { "epoch": 0.58, "learning_rate": 0.00021293701757799829, "loss": 0.0163, "step": 53690 }, { "epoch": 0.58, "learning_rate": 0.00021292080171239538, "loss": 0.018, "step": 53700 }, { "epoch": 0.58, "learning_rate": 0.0002129045858467925, "loss": 0.0213, "step": 53710 }, { "epoch": 0.58, "learning_rate": 0.0002128883699811896, "loss": 0.0158, "step": 53720 }, { "epoch": 0.58, "learning_rate": 0.00021287215411558666, "loss": 0.0185, "step": 53730 }, { "epoch": 0.58, "learning_rate": 0.00021285593824998375, "loss": 0.0161, "step": 53740 }, { "epoch": 0.58, "learning_rate": 0.00021283972238438087, "loss": 0.0153, "step": 53750 }, { "epoch": 0.58, "learning_rate": 0.00021282350651877796, "loss": 0.0179, "step": 53760 }, { "epoch": 0.58, "learning_rate": 0.00021280729065317503, "loss": 0.0195, "step": 53770 }, { "epoch": 0.58, "learning_rate": 0.00021279107478757215, "loss": 0.0223, "step": 53780 }, { "epoch": 0.58, "learning_rate": 0.00021277485892196924, "loss": 0.0159, "step": 53790 }, { "epoch": 0.58, "learning_rate": 0.00021275864305636633, "loss": 0.0207, "step": 53800 }, { "epoch": 0.58, "learning_rate": 0.0002127424271907634, "loss": 0.0162, "step": 53810 }, { "epoch": 0.58, "learning_rate": 0.00021272621132516052, "loss": 0.0155, "step": 53820 }, { "epoch": 0.58, "learning_rate": 0.0002127099954595576, "loss": 0.0163, "step": 53830 }, { "epoch": 0.58, "learning_rate": 0.0002126937795939547, "loss": 0.0169, "step": 53840 }, { "epoch": 0.58, "learning_rate": 0.0002126775637283518, "loss": 0.0205, "step": 53850 }, { "epoch": 0.58, "learning_rate": 0.0002126613478627489, "loss": 0.0157, "step": 53860 }, { "epoch": 0.58, "learning_rate": 0.00021264513199714598, "loss": 0.0154, "step": 53870 }, { "epoch": 0.58, "learning_rate": 0.0002126289161315431, "loss": 0.0173, "step": 53880 }, { "epoch": 0.58, "learning_rate": 0.00021261270026594017, "loss": 0.0155, "step": 53890 }, { "epoch": 0.58, "learning_rate": 0.00021259648440033726, "loss": 0.0169, "step": 53900 }, { "epoch": 0.58, "learning_rate": 0.00021258026853473435, "loss": 0.0155, "step": 53910 }, { "epoch": 0.58, "learning_rate": 0.00021256405266913147, "loss": 0.0214, "step": 53920 }, { "epoch": 0.58, "learning_rate": 0.00021254783680352854, "loss": 0.0175, "step": 53930 }, { "epoch": 0.58, "learning_rate": 0.00021253162093792563, "loss": 0.0181, "step": 53940 }, { "epoch": 0.58, "learning_rate": 0.00021251540507232275, "loss": 0.0167, "step": 53950 }, { "epoch": 0.58, "learning_rate": 0.00021249918920671984, "loss": 0.0184, "step": 53960 }, { "epoch": 0.58, "learning_rate": 0.00021248297334111694, "loss": 0.0166, "step": 53970 }, { "epoch": 0.58, "learning_rate": 0.000212466757475514, "loss": 0.0163, "step": 53980 }, { "epoch": 0.58, "learning_rate": 0.00021245054160991112, "loss": 0.0177, "step": 53990 }, { "epoch": 0.58, "learning_rate": 0.00021243432574430822, "loss": 0.0158, "step": 54000 }, { "epoch": 0.58, "eval_cer": 0.9215590728184603, "eval_loss": 0.012681106105446815, "eval_runtime": 121.7214, "eval_samples_per_second": 16.431, "eval_steps_per_second": 4.108, "step": 54000 }, { "epoch": 0.58, "learning_rate": 0.00021241810987870533, "loss": 0.0182, "step": 54010 }, { "epoch": 0.58, "learning_rate": 0.0002124018940131024, "loss": 0.0187, "step": 54020 }, { "epoch": 0.58, "learning_rate": 0.0002123856781474995, "loss": 0.0187, "step": 54030 }, { "epoch": 0.58, "learning_rate": 0.00021236946228189659, "loss": 0.0199, "step": 54040 }, { "epoch": 0.58, "learning_rate": 0.0002123532464162937, "loss": 0.0162, "step": 54050 }, { "epoch": 0.58, "learning_rate": 0.00021233703055069077, "loss": 0.0164, "step": 54060 }, { "epoch": 0.58, "learning_rate": 0.00021232081468508786, "loss": 0.0174, "step": 54070 }, { "epoch": 0.58, "learning_rate": 0.00021230459881948498, "loss": 0.0185, "step": 54080 }, { "epoch": 0.58, "learning_rate": 0.00021228838295388208, "loss": 0.0207, "step": 54090 }, { "epoch": 0.58, "learning_rate": 0.00021227216708827914, "loss": 0.0186, "step": 54100 }, { "epoch": 0.58, "learning_rate": 0.00021225595122267624, "loss": 0.0153, "step": 54110 }, { "epoch": 0.59, "learning_rate": 0.00021223973535707336, "loss": 0.0168, "step": 54120 }, { "epoch": 0.59, "learning_rate": 0.00021222351949147045, "loss": 0.0192, "step": 54130 }, { "epoch": 0.59, "learning_rate": 0.0002122073036258675, "loss": 0.0167, "step": 54140 }, { "epoch": 0.59, "learning_rate": 0.00021219108776026463, "loss": 0.0176, "step": 54150 }, { "epoch": 0.59, "learning_rate": 0.00021217487189466173, "loss": 0.0186, "step": 54160 }, { "epoch": 0.59, "learning_rate": 0.00021215865602905882, "loss": 0.0185, "step": 54170 }, { "epoch": 0.59, "learning_rate": 0.00021214244016345588, "loss": 0.0222, "step": 54180 }, { "epoch": 0.59, "learning_rate": 0.000212126224297853, "loss": 0.0182, "step": 54190 }, { "epoch": 0.59, "learning_rate": 0.0002121100084322501, "loss": 0.0195, "step": 54200 }, { "epoch": 0.59, "learning_rate": 0.0002120937925666472, "loss": 0.0179, "step": 54210 }, { "epoch": 0.59, "learning_rate": 0.00021207757670104428, "loss": 0.0137, "step": 54220 }, { "epoch": 0.59, "learning_rate": 0.00021206136083544138, "loss": 0.0163, "step": 54230 }, { "epoch": 0.59, "learning_rate": 0.00021204514496983847, "loss": 0.0199, "step": 54240 }, { "epoch": 0.59, "learning_rate": 0.0002120289291042356, "loss": 0.0165, "step": 54250 }, { "epoch": 0.59, "learning_rate": 0.00021201271323863265, "loss": 0.0203, "step": 54260 }, { "epoch": 0.59, "learning_rate": 0.00021199649737302975, "loss": 0.0153, "step": 54270 }, { "epoch": 0.59, "learning_rate": 0.00021198028150742684, "loss": 0.0126, "step": 54280 }, { "epoch": 0.59, "learning_rate": 0.00021196406564182396, "loss": 0.0142, "step": 54290 }, { "epoch": 0.59, "learning_rate": 0.00021194784977622102, "loss": 0.0192, "step": 54300 }, { "epoch": 0.59, "learning_rate": 0.00021193163391061812, "loss": 0.0189, "step": 54310 }, { "epoch": 0.59, "learning_rate": 0.00021191541804501524, "loss": 0.0189, "step": 54320 }, { "epoch": 0.59, "learning_rate": 0.00021189920217941233, "loss": 0.0179, "step": 54330 }, { "epoch": 0.59, "learning_rate": 0.0002118829863138094, "loss": 0.0151, "step": 54340 }, { "epoch": 0.59, "learning_rate": 0.00021186677044820652, "loss": 0.017, "step": 54350 }, { "epoch": 0.59, "learning_rate": 0.0002118505545826036, "loss": 0.0222, "step": 54360 }, { "epoch": 0.59, "learning_rate": 0.0002118343387170007, "loss": 0.0186, "step": 54370 }, { "epoch": 0.59, "learning_rate": 0.00021181812285139777, "loss": 0.0169, "step": 54380 }, { "epoch": 0.59, "learning_rate": 0.00021180190698579489, "loss": 0.0186, "step": 54390 }, { "epoch": 0.59, "learning_rate": 0.00021178569112019198, "loss": 0.0201, "step": 54400 }, { "epoch": 0.59, "learning_rate": 0.00021176947525458907, "loss": 0.0159, "step": 54410 }, { "epoch": 0.59, "learning_rate": 0.00021175325938898616, "loss": 0.0175, "step": 54420 }, { "epoch": 0.59, "learning_rate": 0.00021173704352338326, "loss": 0.0181, "step": 54430 }, { "epoch": 0.59, "learning_rate": 0.00021172082765778035, "loss": 0.014, "step": 54440 }, { "epoch": 0.59, "learning_rate": 0.00021170461179217747, "loss": 0.0172, "step": 54450 }, { "epoch": 0.59, "learning_rate": 0.00021168839592657454, "loss": 0.0188, "step": 54460 }, { "epoch": 0.59, "learning_rate": 0.00021167218006097163, "loss": 0.0175, "step": 54470 }, { "epoch": 0.59, "learning_rate": 0.00021165596419536872, "loss": 0.0191, "step": 54480 }, { "epoch": 0.59, "learning_rate": 0.00021163974832976584, "loss": 0.014, "step": 54490 }, { "epoch": 0.59, "learning_rate": 0.0002116235324641629, "loss": 0.0165, "step": 54500 }, { "epoch": 0.59, "learning_rate": 0.00021160731659856, "loss": 0.0128, "step": 54510 }, { "epoch": 0.59, "learning_rate": 0.00021159110073295712, "loss": 0.0141, "step": 54520 }, { "epoch": 0.59, "learning_rate": 0.0002115748848673542, "loss": 0.015, "step": 54530 }, { "epoch": 0.59, "learning_rate": 0.00021155866900175128, "loss": 0.0166, "step": 54540 }, { "epoch": 0.59, "learning_rate": 0.00021154245313614837, "loss": 0.015, "step": 54550 }, { "epoch": 0.59, "learning_rate": 0.0002115262372705455, "loss": 0.0173, "step": 54560 }, { "epoch": 0.59, "learning_rate": 0.00021151002140494258, "loss": 0.0181, "step": 54570 }, { "epoch": 0.59, "learning_rate": 0.00021149380553933965, "loss": 0.0141, "step": 54580 }, { "epoch": 0.59, "learning_rate": 0.00021147758967373677, "loss": 0.0238, "step": 54590 }, { "epoch": 0.59, "learning_rate": 0.00021146137380813386, "loss": 0.0167, "step": 54600 }, { "epoch": 0.59, "learning_rate": 0.00021144515794253095, "loss": 0.0187, "step": 54610 }, { "epoch": 0.59, "learning_rate": 0.00021142894207692802, "loss": 0.0152, "step": 54620 }, { "epoch": 0.59, "learning_rate": 0.00021141272621132514, "loss": 0.0171, "step": 54630 }, { "epoch": 0.59, "learning_rate": 0.00021139651034572223, "loss": 0.0147, "step": 54640 }, { "epoch": 0.59, "learning_rate": 0.00021138029448011935, "loss": 0.0187, "step": 54650 }, { "epoch": 0.59, "learning_rate": 0.00021136407861451642, "loss": 0.0158, "step": 54660 }, { "epoch": 0.59, "learning_rate": 0.0002113478627489135, "loss": 0.0152, "step": 54670 }, { "epoch": 0.59, "learning_rate": 0.0002113316468833106, "loss": 0.0163, "step": 54680 }, { "epoch": 0.59, "learning_rate": 0.00021131543101770772, "loss": 0.0161, "step": 54690 }, { "epoch": 0.59, "learning_rate": 0.00021129921515210482, "loss": 0.0158, "step": 54700 }, { "epoch": 0.59, "learning_rate": 0.00021128299928650188, "loss": 0.0166, "step": 54710 }, { "epoch": 0.59, "learning_rate": 0.000211266783420899, "loss": 0.02, "step": 54720 }, { "epoch": 0.59, "learning_rate": 0.0002112505675552961, "loss": 0.0176, "step": 54730 }, { "epoch": 0.59, "learning_rate": 0.0002112343516896932, "loss": 0.0177, "step": 54740 }, { "epoch": 0.59, "learning_rate": 0.00021121813582409025, "loss": 0.0151, "step": 54750 }, { "epoch": 0.59, "learning_rate": 0.00021120191995848737, "loss": 0.0173, "step": 54760 }, { "epoch": 0.59, "learning_rate": 0.00021118570409288446, "loss": 0.0147, "step": 54770 }, { "epoch": 0.59, "learning_rate": 0.00021116948822728156, "loss": 0.02, "step": 54780 }, { "epoch": 0.59, "learning_rate": 0.00021115327236167865, "loss": 0.0149, "step": 54790 }, { "epoch": 0.59, "learning_rate": 0.00021113705649607574, "loss": 0.0157, "step": 54800 }, { "epoch": 0.59, "learning_rate": 0.00021112084063047284, "loss": 0.0208, "step": 54810 }, { "epoch": 0.59, "learning_rate": 0.00021110462476486996, "loss": 0.0162, "step": 54820 }, { "epoch": 0.59, "learning_rate": 0.00021108840889926702, "loss": 0.0189, "step": 54830 }, { "epoch": 0.59, "learning_rate": 0.00021107219303366411, "loss": 0.0163, "step": 54840 }, { "epoch": 0.59, "learning_rate": 0.0002110559771680612, "loss": 0.0178, "step": 54850 }, { "epoch": 0.59, "learning_rate": 0.00021103976130245833, "loss": 0.0164, "step": 54860 }, { "epoch": 0.59, "learning_rate": 0.0002110235454368554, "loss": 0.0137, "step": 54870 }, { "epoch": 0.59, "learning_rate": 0.00021100732957125248, "loss": 0.0156, "step": 54880 }, { "epoch": 0.59, "learning_rate": 0.0002109911137056496, "loss": 0.0162, "step": 54890 }, { "epoch": 0.59, "learning_rate": 0.0002109748978400467, "loss": 0.0179, "step": 54900 }, { "epoch": 0.59, "learning_rate": 0.00021095868197444376, "loss": 0.0172, "step": 54910 }, { "epoch": 0.59, "learning_rate": 0.00021094246610884086, "loss": 0.0175, "step": 54920 }, { "epoch": 0.59, "learning_rate": 0.00021092625024323798, "loss": 0.0188, "step": 54930 }, { "epoch": 0.59, "learning_rate": 0.00021091003437763507, "loss": 0.013, "step": 54940 }, { "epoch": 0.59, "learning_rate": 0.00021089381851203213, "loss": 0.0161, "step": 54950 }, { "epoch": 0.59, "learning_rate": 0.00021087760264642925, "loss": 0.0192, "step": 54960 }, { "epoch": 0.59, "learning_rate": 0.00021086138678082635, "loss": 0.0162, "step": 54970 }, { "epoch": 0.59, "learning_rate": 0.00021084517091522344, "loss": 0.017, "step": 54980 }, { "epoch": 0.59, "learning_rate": 0.0002108289550496205, "loss": 0.0144, "step": 54990 }, { "epoch": 0.59, "learning_rate": 0.00021081273918401762, "loss": 0.0145, "step": 55000 }, { "epoch": 0.59, "eval_cer": 0.9215616786273294, "eval_loss": 0.011711681261658669, "eval_runtime": 121.4424, "eval_samples_per_second": 16.469, "eval_steps_per_second": 4.117, "step": 55000 }, { "epoch": 0.59, "learning_rate": 0.00021079652331841472, "loss": 0.0172, "step": 55010 }, { "epoch": 0.59, "learning_rate": 0.00021078030745281184, "loss": 0.0183, "step": 55020 }, { "epoch": 0.59, "learning_rate": 0.0002107640915872089, "loss": 0.0169, "step": 55030 }, { "epoch": 0.6, "learning_rate": 0.000210747875721606, "loss": 0.0184, "step": 55040 }, { "epoch": 0.6, "learning_rate": 0.0002107316598560031, "loss": 0.0166, "step": 55050 }, { "epoch": 0.6, "learning_rate": 0.0002107154439904002, "loss": 0.0207, "step": 55060 }, { "epoch": 0.6, "learning_rate": 0.00021069922812479727, "loss": 0.0196, "step": 55070 }, { "epoch": 0.6, "learning_rate": 0.00021068301225919437, "loss": 0.0197, "step": 55080 }, { "epoch": 0.6, "learning_rate": 0.0002106667963935915, "loss": 0.0178, "step": 55090 }, { "epoch": 0.6, "learning_rate": 0.00021065058052798858, "loss": 0.0149, "step": 55100 }, { "epoch": 0.6, "learning_rate": 0.00021063436466238565, "loss": 0.0175, "step": 55110 }, { "epoch": 0.6, "learning_rate": 0.00021061814879678274, "loss": 0.018, "step": 55120 }, { "epoch": 0.6, "learning_rate": 0.00021060193293117986, "loss": 0.0159, "step": 55130 }, { "epoch": 0.6, "learning_rate": 0.00021058571706557695, "loss": 0.0153, "step": 55140 }, { "epoch": 0.6, "learning_rate": 0.00021056950119997402, "loss": 0.015, "step": 55150 }, { "epoch": 0.6, "learning_rate": 0.00021055328533437114, "loss": 0.019, "step": 55160 }, { "epoch": 0.6, "learning_rate": 0.00021053706946876823, "loss": 0.0166, "step": 55170 }, { "epoch": 0.6, "learning_rate": 0.00021052085360316532, "loss": 0.0205, "step": 55180 }, { "epoch": 0.6, "learning_rate": 0.0002105046377375624, "loss": 0.0164, "step": 55190 }, { "epoch": 0.6, "learning_rate": 0.0002104884218719595, "loss": 0.0151, "step": 55200 }, { "epoch": 0.6, "learning_rate": 0.0002104722060063566, "loss": 0.0191, "step": 55210 }, { "epoch": 0.6, "learning_rate": 0.0002104559901407537, "loss": 0.0162, "step": 55220 }, { "epoch": 0.6, "learning_rate": 0.00021043977427515079, "loss": 0.0248, "step": 55230 }, { "epoch": 0.6, "learning_rate": 0.00021042355840954788, "loss": 0.019, "step": 55240 }, { "epoch": 0.6, "learning_rate": 0.00021040734254394497, "loss": 0.0193, "step": 55250 }, { "epoch": 0.6, "learning_rate": 0.0002103911266783421, "loss": 0.0174, "step": 55260 }, { "epoch": 0.6, "learning_rate": 0.00021037491081273916, "loss": 0.0193, "step": 55270 }, { "epoch": 0.6, "learning_rate": 0.00021035869494713625, "loss": 0.017, "step": 55280 }, { "epoch": 0.6, "learning_rate": 0.00021034247908153334, "loss": 0.0196, "step": 55290 }, { "epoch": 0.6, "learning_rate": 0.00021032626321593046, "loss": 0.0167, "step": 55300 }, { "epoch": 0.6, "learning_rate": 0.00021031004735032753, "loss": 0.0176, "step": 55310 }, { "epoch": 0.6, "learning_rate": 0.00021029383148472462, "loss": 0.0206, "step": 55320 }, { "epoch": 0.6, "learning_rate": 0.00021027761561912174, "loss": 0.0334, "step": 55330 }, { "epoch": 0.6, "learning_rate": 0.00021026139975351883, "loss": 0.0188, "step": 55340 }, { "epoch": 0.6, "learning_rate": 0.0002102451838879159, "loss": 0.0157, "step": 55350 }, { "epoch": 0.6, "learning_rate": 0.00021022896802231302, "loss": 0.0189, "step": 55360 }, { "epoch": 0.6, "learning_rate": 0.0002102127521567101, "loss": 0.0183, "step": 55370 }, { "epoch": 0.6, "learning_rate": 0.0002101965362911072, "loss": 0.0206, "step": 55380 }, { "epoch": 0.6, "learning_rate": 0.00021018032042550432, "loss": 0.02, "step": 55390 }, { "epoch": 0.6, "learning_rate": 0.0002101641045599014, "loss": 0.0156, "step": 55400 }, { "epoch": 0.6, "learning_rate": 0.00021014788869429848, "loss": 0.0167, "step": 55410 }, { "epoch": 0.6, "learning_rate": 0.00021013167282869557, "loss": 0.0166, "step": 55420 }, { "epoch": 0.6, "learning_rate": 0.0002101154569630927, "loss": 0.0151, "step": 55430 }, { "epoch": 0.6, "learning_rate": 0.00021009924109748976, "loss": 0.0168, "step": 55440 }, { "epoch": 0.6, "learning_rate": 0.00021008302523188685, "loss": 0.0158, "step": 55450 }, { "epoch": 0.6, "learning_rate": 0.00021006680936628397, "loss": 0.0168, "step": 55460 }, { "epoch": 0.6, "learning_rate": 0.00021005059350068107, "loss": 0.0177, "step": 55470 }, { "epoch": 0.6, "learning_rate": 0.00021003437763507813, "loss": 0.0176, "step": 55480 }, { "epoch": 0.6, "learning_rate": 0.00021001816176947522, "loss": 0.0175, "step": 55490 }, { "epoch": 0.6, "learning_rate": 0.00021000194590387234, "loss": 0.0157, "step": 55500 }, { "epoch": 0.6, "learning_rate": 0.00020998573003826944, "loss": 0.0178, "step": 55510 }, { "epoch": 0.6, "learning_rate": 0.0002099695141726665, "loss": 0.0161, "step": 55520 }, { "epoch": 0.6, "learning_rate": 0.00020995329830706362, "loss": 0.0163, "step": 55530 }, { "epoch": 0.6, "learning_rate": 0.00020993708244146071, "loss": 0.0146, "step": 55540 }, { "epoch": 0.6, "learning_rate": 0.0002099208665758578, "loss": 0.018, "step": 55550 }, { "epoch": 0.6, "learning_rate": 0.00020990465071025487, "loss": 0.0166, "step": 55560 }, { "epoch": 0.6, "learning_rate": 0.000209888434844652, "loss": 0.0208, "step": 55570 }, { "epoch": 0.6, "learning_rate": 0.00020987221897904909, "loss": 0.0177, "step": 55580 }, { "epoch": 0.6, "learning_rate": 0.00020985600311344618, "loss": 0.0191, "step": 55590 }, { "epoch": 0.6, "learning_rate": 0.00020983978724784327, "loss": 0.0172, "step": 55600 }, { "epoch": 0.6, "learning_rate": 0.00020982357138224036, "loss": 0.0168, "step": 55610 }, { "epoch": 0.6, "learning_rate": 0.00020980735551663746, "loss": 0.0173, "step": 55620 }, { "epoch": 0.6, "learning_rate": 0.00020979113965103458, "loss": 0.0194, "step": 55630 }, { "epoch": 0.6, "learning_rate": 0.00020977492378543164, "loss": 0.0158, "step": 55640 }, { "epoch": 0.6, "learning_rate": 0.00020975870791982873, "loss": 0.0146, "step": 55650 }, { "epoch": 0.6, "learning_rate": 0.00020974249205422585, "loss": 0.019, "step": 55660 }, { "epoch": 0.6, "learning_rate": 0.00020972627618862295, "loss": 0.0187, "step": 55670 }, { "epoch": 0.6, "learning_rate": 0.00020971006032302, "loss": 0.0182, "step": 55680 }, { "epoch": 0.6, "learning_rate": 0.0002096938444574171, "loss": 0.0209, "step": 55690 }, { "epoch": 0.6, "learning_rate": 0.00020967762859181423, "loss": 0.02, "step": 55700 }, { "epoch": 0.6, "learning_rate": 0.00020966141272621132, "loss": 0.0182, "step": 55710 }, { "epoch": 0.6, "learning_rate": 0.00020964519686060838, "loss": 0.0164, "step": 55720 }, { "epoch": 0.6, "learning_rate": 0.0002096289809950055, "loss": 0.0171, "step": 55730 }, { "epoch": 0.6, "learning_rate": 0.0002096127651294026, "loss": 0.0181, "step": 55740 }, { "epoch": 0.6, "learning_rate": 0.0002095965492637997, "loss": 0.0159, "step": 55750 }, { "epoch": 0.6, "learning_rate": 0.00020958033339819675, "loss": 0.0156, "step": 55760 }, { "epoch": 0.6, "learning_rate": 0.00020956411753259387, "loss": 0.0193, "step": 55770 }, { "epoch": 0.6, "learning_rate": 0.00020954790166699097, "loss": 0.0182, "step": 55780 }, { "epoch": 0.6, "learning_rate": 0.00020953168580138806, "loss": 0.0183, "step": 55790 }, { "epoch": 0.6, "learning_rate": 0.00020951546993578515, "loss": 0.018, "step": 55800 }, { "epoch": 0.6, "learning_rate": 0.00020949925407018225, "loss": 0.0191, "step": 55810 }, { "epoch": 0.6, "learning_rate": 0.00020948303820457934, "loss": 0.0168, "step": 55820 }, { "epoch": 0.6, "learning_rate": 0.00020946682233897646, "loss": 0.0143, "step": 55830 }, { "epoch": 0.6, "learning_rate": 0.00020945060647337352, "loss": 0.0145, "step": 55840 }, { "epoch": 0.6, "learning_rate": 0.00020943439060777062, "loss": 0.0165, "step": 55850 }, { "epoch": 0.6, "learning_rate": 0.0002094181747421677, "loss": 0.0163, "step": 55860 }, { "epoch": 0.6, "learning_rate": 0.00020940195887656483, "loss": 0.0188, "step": 55870 }, { "epoch": 0.6, "learning_rate": 0.0002093857430109619, "loss": 0.0178, "step": 55880 }, { "epoch": 0.6, "learning_rate": 0.000209369527145359, "loss": 0.0193, "step": 55890 }, { "epoch": 0.6, "learning_rate": 0.0002093533112797561, "loss": 0.0196, "step": 55900 }, { "epoch": 0.6, "learning_rate": 0.0002093370954141532, "loss": 0.0154, "step": 55910 }, { "epoch": 0.6, "learning_rate": 0.00020932087954855027, "loss": 0.017, "step": 55920 }, { "epoch": 0.6, "learning_rate": 0.00020930466368294736, "loss": 0.0166, "step": 55930 }, { "epoch": 0.6, "learning_rate": 0.00020928844781734448, "loss": 0.0149, "step": 55940 }, { "epoch": 0.6, "learning_rate": 0.00020927223195174157, "loss": 0.0173, "step": 55950 }, { "epoch": 0.6, "learning_rate": 0.00020925601608613864, "loss": 0.0212, "step": 55960 }, { "epoch": 0.61, "learning_rate": 0.00020923980022053576, "loss": 0.0189, "step": 55970 }, { "epoch": 0.61, "learning_rate": 0.00020922358435493285, "loss": 0.0167, "step": 55980 }, { "epoch": 0.61, "learning_rate": 0.00020920736848932994, "loss": 0.0172, "step": 55990 }, { "epoch": 0.61, "learning_rate": 0.000209191152623727, "loss": 0.0148, "step": 56000 }, { "epoch": 0.61, "eval_cer": 0.9215573356125475, "eval_loss": 0.01228960882872343, "eval_runtime": 121.224, "eval_samples_per_second": 16.498, "eval_steps_per_second": 4.125, "step": 56000 }, { "epoch": 0.61, "learning_rate": 0.00020917493675812413, "loss": 0.0161, "step": 56010 }, { "epoch": 0.61, "learning_rate": 0.00020915872089252122, "loss": 0.0183, "step": 56020 }, { "epoch": 0.61, "learning_rate": 0.00020914250502691834, "loss": 0.0171, "step": 56030 }, { "epoch": 0.61, "learning_rate": 0.0002091262891613154, "loss": 0.0174, "step": 56040 }, { "epoch": 0.61, "learning_rate": 0.0002091100732957125, "loss": 0.0163, "step": 56050 }, { "epoch": 0.61, "learning_rate": 0.0002090938574301096, "loss": 0.0181, "step": 56060 }, { "epoch": 0.61, "learning_rate": 0.0002090776415645067, "loss": 0.0169, "step": 56070 }, { "epoch": 0.61, "learning_rate": 0.00020906142569890378, "loss": 0.0175, "step": 56080 }, { "epoch": 0.61, "learning_rate": 0.00020904520983330087, "loss": 0.0202, "step": 56090 }, { "epoch": 0.61, "learning_rate": 0.000209028993967698, "loss": 0.0169, "step": 56100 }, { "epoch": 0.61, "learning_rate": 0.00020901277810209508, "loss": 0.0188, "step": 56110 }, { "epoch": 0.61, "learning_rate": 0.00020899656223649217, "loss": 0.0153, "step": 56120 }, { "epoch": 0.61, "learning_rate": 0.00020898034637088924, "loss": 0.0161, "step": 56130 }, { "epoch": 0.61, "learning_rate": 0.00020896413050528636, "loss": 0.0165, "step": 56140 }, { "epoch": 0.61, "learning_rate": 0.00020894791463968345, "loss": 0.0131, "step": 56150 }, { "epoch": 0.61, "learning_rate": 0.00020893169877408055, "loss": 0.0206, "step": 56160 }, { "epoch": 0.61, "learning_rate": 0.00020891548290847764, "loss": 0.0126, "step": 56170 }, { "epoch": 0.61, "learning_rate": 0.00020889926704287473, "loss": 0.016, "step": 56180 }, { "epoch": 0.61, "learning_rate": 0.00020888305117727182, "loss": 0.016, "step": 56190 }, { "epoch": 0.61, "learning_rate": 0.00020886683531166894, "loss": 0.0174, "step": 56200 }, { "epoch": 0.61, "learning_rate": 0.000208850619446066, "loss": 0.019, "step": 56210 }, { "epoch": 0.61, "learning_rate": 0.0002088344035804631, "loss": 0.0191, "step": 56220 }, { "epoch": 0.61, "learning_rate": 0.0002088181877148602, "loss": 0.0148, "step": 56230 }, { "epoch": 0.61, "learning_rate": 0.00020880197184925731, "loss": 0.0162, "step": 56240 }, { "epoch": 0.61, "learning_rate": 0.00020878575598365438, "loss": 0.0178, "step": 56250 }, { "epoch": 0.61, "learning_rate": 0.00020876954011805147, "loss": 0.0149, "step": 56260 }, { "epoch": 0.61, "learning_rate": 0.0002087533242524486, "loss": 0.0201, "step": 56270 }, { "epoch": 0.61, "learning_rate": 0.00020873710838684569, "loss": 0.0167, "step": 56280 }, { "epoch": 0.61, "learning_rate": 0.00020872089252124275, "loss": 0.0192, "step": 56290 }, { "epoch": 0.61, "learning_rate": 0.00020870467665563984, "loss": 0.0156, "step": 56300 }, { "epoch": 0.61, "learning_rate": 0.00020868846079003696, "loss": 0.0178, "step": 56310 }, { "epoch": 0.61, "learning_rate": 0.00020867224492443406, "loss": 0.018, "step": 56320 }, { "epoch": 0.61, "learning_rate": 0.00020865602905883112, "loss": 0.0135, "step": 56330 }, { "epoch": 0.61, "learning_rate": 0.00020863981319322824, "loss": 0.0181, "step": 56340 }, { "epoch": 0.61, "learning_rate": 0.00020862359732762534, "loss": 0.0189, "step": 56350 }, { "epoch": 0.61, "learning_rate": 0.00020860738146202243, "loss": 0.0144, "step": 56360 }, { "epoch": 0.61, "learning_rate": 0.00020859116559641952, "loss": 0.0185, "step": 56370 }, { "epoch": 0.61, "learning_rate": 0.0002085749497308166, "loss": 0.0138, "step": 56380 }, { "epoch": 0.61, "learning_rate": 0.0002085587338652137, "loss": 0.0165, "step": 56390 }, { "epoch": 0.61, "learning_rate": 0.00020854251799961083, "loss": 0.0173, "step": 56400 }, { "epoch": 0.61, "learning_rate": 0.0002085263021340079, "loss": 0.0185, "step": 56410 }, { "epoch": 0.61, "learning_rate": 0.00020851008626840498, "loss": 0.0162, "step": 56420 }, { "epoch": 0.61, "learning_rate": 0.00020849387040280208, "loss": 0.0155, "step": 56430 }, { "epoch": 0.61, "learning_rate": 0.0002084776545371992, "loss": 0.019, "step": 56440 }, { "epoch": 0.61, "learning_rate": 0.00020846143867159626, "loss": 0.0174, "step": 56450 }, { "epoch": 0.61, "learning_rate": 0.00020844522280599336, "loss": 0.0147, "step": 56460 }, { "epoch": 0.61, "learning_rate": 0.00020842900694039048, "loss": 0.0163, "step": 56470 }, { "epoch": 0.61, "learning_rate": 0.00020841279107478757, "loss": 0.0185, "step": 56480 }, { "epoch": 0.61, "learning_rate": 0.00020839657520918463, "loss": 0.016, "step": 56490 }, { "epoch": 0.61, "learning_rate": 0.00020838035934358173, "loss": 0.0161, "step": 56500 }, { "epoch": 0.61, "learning_rate": 0.00020836414347797885, "loss": 0.0233, "step": 56510 }, { "epoch": 0.61, "learning_rate": 0.00020834792761237594, "loss": 0.0176, "step": 56520 }, { "epoch": 0.61, "learning_rate": 0.000208331711746773, "loss": 0.0177, "step": 56530 }, { "epoch": 0.61, "learning_rate": 0.00020831549588117012, "loss": 0.0149, "step": 56540 }, { "epoch": 0.61, "learning_rate": 0.00020829928001556722, "loss": 0.015, "step": 56550 }, { "epoch": 0.61, "learning_rate": 0.0002082830641499643, "loss": 0.0143, "step": 56560 }, { "epoch": 0.61, "learning_rate": 0.00020826684828436138, "loss": 0.0145, "step": 56570 }, { "epoch": 0.61, "learning_rate": 0.0002082506324187585, "loss": 0.0178, "step": 56580 }, { "epoch": 0.61, "learning_rate": 0.0002082344165531556, "loss": 0.0209, "step": 56590 }, { "epoch": 0.61, "learning_rate": 0.00020821820068755268, "loss": 0.016, "step": 56600 }, { "epoch": 0.61, "learning_rate": 0.00020820198482194977, "loss": 0.0178, "step": 56610 }, { "epoch": 0.61, "learning_rate": 0.00020818576895634687, "loss": 0.015, "step": 56620 }, { "epoch": 0.61, "learning_rate": 0.00020816955309074396, "loss": 0.0179, "step": 56630 }, { "epoch": 0.61, "learning_rate": 0.00020815333722514108, "loss": 0.019, "step": 56640 }, { "epoch": 0.61, "learning_rate": 0.00020813712135953814, "loss": 0.015, "step": 56650 }, { "epoch": 0.61, "learning_rate": 0.00020812090549393524, "loss": 0.0187, "step": 56660 }, { "epoch": 0.61, "learning_rate": 0.00020810468962833236, "loss": 0.0156, "step": 56670 }, { "epoch": 0.61, "learning_rate": 0.00020808847376272945, "loss": 0.017, "step": 56680 }, { "epoch": 0.61, "learning_rate": 0.00020807225789712652, "loss": 0.0147, "step": 56690 }, { "epoch": 0.61, "learning_rate": 0.0002080560420315236, "loss": 0.0163, "step": 56700 }, { "epoch": 0.61, "learning_rate": 0.00020803982616592073, "loss": 0.0158, "step": 56710 }, { "epoch": 0.61, "learning_rate": 0.00020802361030031782, "loss": 0.0167, "step": 56720 }, { "epoch": 0.61, "learning_rate": 0.0002080073944347149, "loss": 0.0173, "step": 56730 }, { "epoch": 0.61, "learning_rate": 0.000207991178569112, "loss": 0.0188, "step": 56740 }, { "epoch": 0.61, "learning_rate": 0.0002079749627035091, "loss": 0.0181, "step": 56750 }, { "epoch": 0.61, "learning_rate": 0.0002079587468379062, "loss": 0.0164, "step": 56760 }, { "epoch": 0.61, "learning_rate": 0.00020794253097230326, "loss": 0.0176, "step": 56770 }, { "epoch": 0.61, "learning_rate": 0.00020792631510670038, "loss": 0.012, "step": 56780 }, { "epoch": 0.61, "learning_rate": 0.00020791009924109747, "loss": 0.0172, "step": 56790 }, { "epoch": 0.61, "learning_rate": 0.00020789388337549456, "loss": 0.0146, "step": 56800 }, { "epoch": 0.61, "learning_rate": 0.00020787766750989166, "loss": 0.0138, "step": 56810 }, { "epoch": 0.61, "learning_rate": 0.00020786145164428875, "loss": 0.0176, "step": 56820 }, { "epoch": 0.61, "learning_rate": 0.00020784523577868584, "loss": 0.0154, "step": 56830 }, { "epoch": 0.61, "learning_rate": 0.00020782901991308296, "loss": 0.0151, "step": 56840 }, { "epoch": 0.61, "learning_rate": 0.00020781280404748005, "loss": 0.0171, "step": 56850 }, { "epoch": 0.61, "learning_rate": 0.00020779658818187712, "loss": 0.0147, "step": 56860 }, { "epoch": 0.61, "learning_rate": 0.0002077803723162742, "loss": 0.0163, "step": 56870 }, { "epoch": 0.61, "learning_rate": 0.00020776415645067133, "loss": 0.0212, "step": 56880 }, { "epoch": 0.62, "learning_rate": 0.00020774794058506842, "loss": 0.0164, "step": 56890 }, { "epoch": 0.62, "learning_rate": 0.0002077317247194655, "loss": 0.0164, "step": 56900 }, { "epoch": 0.62, "learning_rate": 0.0002077155088538626, "loss": 0.0173, "step": 56910 }, { "epoch": 0.62, "learning_rate": 0.0002076992929882597, "loss": 0.0177, "step": 56920 }, { "epoch": 0.62, "learning_rate": 0.0002076830771226568, "loss": 0.0133, "step": 56930 }, { "epoch": 0.62, "learning_rate": 0.00020766686125705386, "loss": 0.0188, "step": 56940 }, { "epoch": 0.62, "learning_rate": 0.00020765064539145098, "loss": 0.0149, "step": 56950 }, { "epoch": 0.62, "learning_rate": 0.00020763442952584807, "loss": 0.0164, "step": 56960 }, { "epoch": 0.62, "learning_rate": 0.0002076182136602452, "loss": 0.0166, "step": 56970 }, { "epoch": 0.62, "learning_rate": 0.00020760199779464226, "loss": 0.0141, "step": 56980 }, { "epoch": 0.62, "learning_rate": 0.00020758578192903935, "loss": 0.0154, "step": 56990 }, { "epoch": 0.62, "learning_rate": 0.00020756956606343644, "loss": 0.0153, "step": 57000 }, { "epoch": 0.62, "eval_cer": 0.9215564670095912, "eval_loss": 0.01153921615332365, "eval_runtime": 121.3157, "eval_samples_per_second": 16.486, "eval_steps_per_second": 4.121, "step": 57000 }, { "epoch": 0.62, "learning_rate": 0.00020755335019783356, "loss": 0.0154, "step": 57010 }, { "epoch": 0.62, "learning_rate": 0.00020753713433223063, "loss": 0.0172, "step": 57020 }, { "epoch": 0.62, "learning_rate": 0.00020752091846662772, "loss": 0.015, "step": 57030 }, { "epoch": 0.62, "learning_rate": 0.00020750470260102484, "loss": 0.0174, "step": 57040 }, { "epoch": 0.62, "learning_rate": 0.00020748848673542194, "loss": 0.0205, "step": 57050 }, { "epoch": 0.62, "learning_rate": 0.000207472270869819, "loss": 0.017, "step": 57060 }, { "epoch": 0.62, "learning_rate": 0.0002074560550042161, "loss": 0.0206, "step": 57070 }, { "epoch": 0.62, "learning_rate": 0.00020743983913861321, "loss": 0.0182, "step": 57080 }, { "epoch": 0.62, "learning_rate": 0.0002074236232730103, "loss": 0.0161, "step": 57090 }, { "epoch": 0.62, "learning_rate": 0.00020740740740740737, "loss": 0.0149, "step": 57100 }, { "epoch": 0.62, "learning_rate": 0.0002073911915418045, "loss": 0.0153, "step": 57110 }, { "epoch": 0.62, "learning_rate": 0.00020737497567620158, "loss": 0.0175, "step": 57120 }, { "epoch": 0.62, "learning_rate": 0.00020735875981059868, "loss": 0.0142, "step": 57130 }, { "epoch": 0.62, "learning_rate": 0.00020734254394499574, "loss": 0.0206, "step": 57140 }, { "epoch": 0.62, "learning_rate": 0.00020732632807939286, "loss": 0.015, "step": 57150 }, { "epoch": 0.62, "learning_rate": 0.00020731011221378996, "loss": 0.0148, "step": 57160 }, { "epoch": 0.62, "learning_rate": 0.00020729389634818705, "loss": 0.0153, "step": 57170 }, { "epoch": 0.62, "learning_rate": 0.00020727768048258414, "loss": 0.0211, "step": 57180 }, { "epoch": 0.62, "learning_rate": 0.00020726146461698123, "loss": 0.0171, "step": 57190 }, { "epoch": 0.62, "learning_rate": 0.00020724524875137833, "loss": 0.0217, "step": 57200 }, { "epoch": 0.62, "learning_rate": 0.00020722903288577545, "loss": 0.018, "step": 57210 }, { "epoch": 0.62, "learning_rate": 0.0002072128170201725, "loss": 0.0161, "step": 57220 }, { "epoch": 0.62, "learning_rate": 0.0002071966011545696, "loss": 0.0159, "step": 57230 }, { "epoch": 0.62, "learning_rate": 0.0002071803852889667, "loss": 0.0137, "step": 57240 }, { "epoch": 0.62, "learning_rate": 0.00020716416942336382, "loss": 0.0175, "step": 57250 }, { "epoch": 0.62, "learning_rate": 0.00020714795355776088, "loss": 0.0156, "step": 57260 }, { "epoch": 0.62, "learning_rate": 0.00020713173769215798, "loss": 0.0164, "step": 57270 }, { "epoch": 0.62, "learning_rate": 0.0002071155218265551, "loss": 0.017, "step": 57280 }, { "epoch": 0.62, "learning_rate": 0.0002070993059609522, "loss": 0.019, "step": 57290 }, { "epoch": 0.62, "learning_rate": 0.00020708309009534925, "loss": 0.0185, "step": 57300 }, { "epoch": 0.62, "learning_rate": 0.00020706687422974635, "loss": 0.0205, "step": 57310 }, { "epoch": 0.62, "learning_rate": 0.00020705065836414347, "loss": 0.0177, "step": 57320 }, { "epoch": 0.62, "learning_rate": 0.00020703444249854056, "loss": 0.0226, "step": 57330 }, { "epoch": 0.62, "learning_rate": 0.00020701822663293763, "loss": 0.0184, "step": 57340 }, { "epoch": 0.62, "learning_rate": 0.00020700201076733474, "loss": 0.0142, "step": 57350 }, { "epoch": 0.62, "learning_rate": 0.00020698579490173184, "loss": 0.019, "step": 57360 }, { "epoch": 0.62, "learning_rate": 0.00020696957903612893, "loss": 0.018, "step": 57370 }, { "epoch": 0.62, "learning_rate": 0.00020695336317052602, "loss": 0.0189, "step": 57380 }, { "epoch": 0.62, "learning_rate": 0.00020693714730492312, "loss": 0.0164, "step": 57390 }, { "epoch": 0.62, "learning_rate": 0.0002069209314393202, "loss": 0.0171, "step": 57400 }, { "epoch": 0.62, "learning_rate": 0.00020690471557371733, "loss": 0.0157, "step": 57410 }, { "epoch": 0.62, "learning_rate": 0.0002068884997081144, "loss": 0.0152, "step": 57420 }, { "epoch": 0.62, "learning_rate": 0.0002068722838425115, "loss": 0.0136, "step": 57430 }, { "epoch": 0.62, "learning_rate": 0.00020685606797690858, "loss": 0.0154, "step": 57440 }, { "epoch": 0.62, "learning_rate": 0.0002068398521113057, "loss": 0.0197, "step": 57450 }, { "epoch": 0.62, "learning_rate": 0.00020682363624570277, "loss": 0.0151, "step": 57460 }, { "epoch": 0.62, "learning_rate": 0.00020680742038009986, "loss": 0.0182, "step": 57470 }, { "epoch": 0.62, "learning_rate": 0.00020679120451449698, "loss": 0.0147, "step": 57480 }, { "epoch": 0.62, "learning_rate": 0.00020677498864889407, "loss": 0.0162, "step": 57490 }, { "epoch": 0.62, "learning_rate": 0.00020675877278329114, "loss": 0.0139, "step": 57500 }, { "epoch": 0.62, "learning_rate": 0.00020674255691768823, "loss": 0.0164, "step": 57510 }, { "epoch": 0.62, "learning_rate": 0.00020672634105208535, "loss": 0.0163, "step": 57520 }, { "epoch": 0.62, "learning_rate": 0.00020671012518648244, "loss": 0.0173, "step": 57530 }, { "epoch": 0.62, "learning_rate": 0.0002066939093208795, "loss": 0.017, "step": 57540 }, { "epoch": 0.62, "learning_rate": 0.00020667769345527663, "loss": 0.0178, "step": 57550 }, { "epoch": 0.62, "learning_rate": 0.00020666147758967372, "loss": 0.0177, "step": 57560 }, { "epoch": 0.62, "learning_rate": 0.0002066452617240708, "loss": 0.014, "step": 57570 }, { "epoch": 0.62, "learning_rate": 0.00020662904585846793, "loss": 0.0195, "step": 57580 }, { "epoch": 0.62, "learning_rate": 0.000206612829992865, "loss": 0.0127, "step": 57590 }, { "epoch": 0.62, "learning_rate": 0.0002065966141272621, "loss": 0.0154, "step": 57600 }, { "epoch": 0.62, "learning_rate": 0.00020658039826165918, "loss": 0.0159, "step": 57610 }, { "epoch": 0.62, "learning_rate": 0.0002065641823960563, "loss": 0.017, "step": 57620 }, { "epoch": 0.62, "learning_rate": 0.00020654796653045337, "loss": 0.0158, "step": 57630 }, { "epoch": 0.62, "learning_rate": 0.00020653175066485046, "loss": 0.0169, "step": 57640 }, { "epoch": 0.62, "learning_rate": 0.00020651553479924758, "loss": 0.0163, "step": 57650 }, { "epoch": 0.62, "learning_rate": 0.00020649931893364467, "loss": 0.0154, "step": 57660 }, { "epoch": 0.62, "learning_rate": 0.00020648310306804174, "loss": 0.0188, "step": 57670 }, { "epoch": 0.62, "learning_rate": 0.00020646688720243886, "loss": 0.0252, "step": 57680 }, { "epoch": 0.62, "learning_rate": 0.00020645067133683595, "loss": 0.0229, "step": 57690 }, { "epoch": 0.62, "learning_rate": 0.00020643445547123305, "loss": 0.0186, "step": 57700 }, { "epoch": 0.62, "learning_rate": 0.0002064182396056301, "loss": 0.0227, "step": 57710 }, { "epoch": 0.62, "learning_rate": 0.00020640202374002723, "loss": 0.0176, "step": 57720 }, { "epoch": 0.62, "learning_rate": 0.00020638580787442432, "loss": 0.0168, "step": 57730 }, { "epoch": 0.62, "learning_rate": 0.00020636959200882142, "loss": 0.0169, "step": 57740 }, { "epoch": 0.62, "learning_rate": 0.0002063533761432185, "loss": 0.0161, "step": 57750 }, { "epoch": 0.62, "learning_rate": 0.0002063371602776156, "loss": 0.0173, "step": 57760 }, { "epoch": 0.62, "learning_rate": 0.0002063209444120127, "loss": 0.0176, "step": 57770 }, { "epoch": 0.62, "learning_rate": 0.00020630472854640981, "loss": 0.0225, "step": 57780 }, { "epoch": 0.62, "learning_rate": 0.00020628851268080688, "loss": 0.0172, "step": 57790 }, { "epoch": 0.62, "learning_rate": 0.00020627229681520397, "loss": 0.0173, "step": 57800 }, { "epoch": 0.62, "learning_rate": 0.00020625608094960107, "loss": 0.0169, "step": 57810 }, { "epoch": 0.63, "learning_rate": 0.00020623986508399819, "loss": 0.0186, "step": 57820 }, { "epoch": 0.63, "learning_rate": 0.00020622364921839525, "loss": 0.0147, "step": 57830 }, { "epoch": 0.63, "learning_rate": 0.00020620743335279234, "loss": 0.0174, "step": 57840 }, { "epoch": 0.63, "learning_rate": 0.00020619121748718946, "loss": 0.0187, "step": 57850 }, { "epoch": 0.63, "learning_rate": 0.00020617500162158656, "loss": 0.0176, "step": 57860 }, { "epoch": 0.63, "learning_rate": 0.00020615878575598362, "loss": 0.0167, "step": 57870 }, { "epoch": 0.63, "learning_rate": 0.00020614256989038071, "loss": 0.0157, "step": 57880 }, { "epoch": 0.63, "learning_rate": 0.00020612635402477783, "loss": 0.0141, "step": 57890 }, { "epoch": 0.63, "learning_rate": 0.00020611013815917493, "loss": 0.0134, "step": 57900 }, { "epoch": 0.63, "learning_rate": 0.000206093922293572, "loss": 0.0149, "step": 57910 }, { "epoch": 0.63, "learning_rate": 0.0002060777064279691, "loss": 0.0184, "step": 57920 }, { "epoch": 0.63, "learning_rate": 0.0002060614905623662, "loss": 0.0132, "step": 57930 }, { "epoch": 0.63, "learning_rate": 0.0002060452746967633, "loss": 0.0153, "step": 57940 }, { "epoch": 0.63, "learning_rate": 0.00020602905883116036, "loss": 0.0151, "step": 57950 }, { "epoch": 0.63, "learning_rate": 0.00020601284296555748, "loss": 0.0182, "step": 57960 }, { "epoch": 0.63, "learning_rate": 0.00020599662709995458, "loss": 0.0175, "step": 57970 }, { "epoch": 0.63, "learning_rate": 0.0002059804112343517, "loss": 0.0189, "step": 57980 }, { "epoch": 0.63, "learning_rate": 0.00020596419536874876, "loss": 0.0142, "step": 57990 }, { "epoch": 0.63, "learning_rate": 0.00020594797950314585, "loss": 0.0182, "step": 58000 }, { "epoch": 0.63, "eval_cer": 0.9215660216421112, "eval_loss": 0.011522618122398853, "eval_runtime": 121.2413, "eval_samples_per_second": 16.496, "eval_steps_per_second": 4.124, "step": 58000 }, { "epoch": 0.63, "learning_rate": 0.00020593176363754295, "loss": 0.0158, "step": 58010 }, { "epoch": 0.63, "learning_rate": 0.00020591554777194007, "loss": 0.0142, "step": 58020 }, { "epoch": 0.63, "learning_rate": 0.00020589933190633713, "loss": 0.0179, "step": 58030 }, { "epoch": 0.63, "learning_rate": 0.00020588311604073423, "loss": 0.0212, "step": 58040 }, { "epoch": 0.63, "learning_rate": 0.00020586690017513135, "loss": 0.0193, "step": 58050 }, { "epoch": 0.63, "learning_rate": 0.00020585068430952844, "loss": 0.0181, "step": 58060 }, { "epoch": 0.63, "learning_rate": 0.0002058344684439255, "loss": 0.0178, "step": 58070 }, { "epoch": 0.63, "learning_rate": 0.0002058182525783226, "loss": 0.0171, "step": 58080 }, { "epoch": 0.63, "learning_rate": 0.00020580203671271972, "loss": 0.0158, "step": 58090 }, { "epoch": 0.63, "learning_rate": 0.0002057858208471168, "loss": 0.0198, "step": 58100 }, { "epoch": 0.63, "learning_rate": 0.00020576960498151387, "loss": 0.0174, "step": 58110 }, { "epoch": 0.63, "learning_rate": 0.000205753389115911, "loss": 0.0188, "step": 58120 }, { "epoch": 0.63, "learning_rate": 0.0002057371732503081, "loss": 0.0168, "step": 58130 }, { "epoch": 0.63, "learning_rate": 0.00020572095738470518, "loss": 0.0125, "step": 58140 }, { "epoch": 0.63, "learning_rate": 0.00020570474151910225, "loss": 0.0185, "step": 58150 }, { "epoch": 0.63, "learning_rate": 0.00020568852565349937, "loss": 0.017, "step": 58160 }, { "epoch": 0.63, "learning_rate": 0.00020567230978789646, "loss": 0.0166, "step": 58170 }, { "epoch": 0.63, "learning_rate": 0.00020565609392229355, "loss": 0.0164, "step": 58180 }, { "epoch": 0.63, "learning_rate": 0.00020563987805669064, "loss": 0.0149, "step": 58190 }, { "epoch": 0.63, "learning_rate": 0.00020562366219108774, "loss": 0.0189, "step": 58200 }, { "epoch": 0.63, "learning_rate": 0.00020560744632548483, "loss": 0.0151, "step": 58210 }, { "epoch": 0.63, "learning_rate": 0.00020559123045988195, "loss": 0.0159, "step": 58220 }, { "epoch": 0.63, "learning_rate": 0.00020557501459427901, "loss": 0.0218, "step": 58230 }, { "epoch": 0.63, "learning_rate": 0.0002055587987286761, "loss": 0.0169, "step": 58240 }, { "epoch": 0.63, "learning_rate": 0.0002055425828630732, "loss": 0.0194, "step": 58250 }, { "epoch": 0.63, "learning_rate": 0.00020552636699747032, "loss": 0.0155, "step": 58260 }, { "epoch": 0.63, "learning_rate": 0.0002055101511318674, "loss": 0.0176, "step": 58270 }, { "epoch": 0.63, "learning_rate": 0.00020549393526626448, "loss": 0.02, "step": 58280 }, { "epoch": 0.63, "learning_rate": 0.0002054777194006616, "loss": 0.0157, "step": 58290 }, { "epoch": 0.63, "learning_rate": 0.0002054615035350587, "loss": 0.0169, "step": 58300 }, { "epoch": 0.63, "learning_rate": 0.00020544528766945578, "loss": 0.0162, "step": 58310 }, { "epoch": 0.63, "learning_rate": 0.00020542907180385285, "loss": 0.0204, "step": 58320 }, { "epoch": 0.63, "learning_rate": 0.00020541285593824997, "loss": 0.0171, "step": 58330 }, { "epoch": 0.63, "learning_rate": 0.00020539664007264706, "loss": 0.0202, "step": 58340 }, { "epoch": 0.63, "learning_rate": 0.00020538042420704418, "loss": 0.0172, "step": 58350 }, { "epoch": 0.63, "learning_rate": 0.00020536420834144125, "loss": 0.0187, "step": 58360 }, { "epoch": 0.63, "learning_rate": 0.00020534799247583834, "loss": 0.0192, "step": 58370 }, { "epoch": 0.63, "learning_rate": 0.00020533177661023543, "loss": 0.0163, "step": 58380 }, { "epoch": 0.63, "learning_rate": 0.00020531556074463255, "loss": 0.0167, "step": 58390 }, { "epoch": 0.63, "learning_rate": 0.00020529934487902962, "loss": 0.0162, "step": 58400 }, { "epoch": 0.63, "learning_rate": 0.0002052831290134267, "loss": 0.0178, "step": 58410 }, { "epoch": 0.63, "learning_rate": 0.00020526691314782383, "loss": 0.0158, "step": 58420 }, { "epoch": 0.63, "learning_rate": 0.00020525069728222092, "loss": 0.0168, "step": 58430 }, { "epoch": 0.63, "learning_rate": 0.000205234481416618, "loss": 0.017, "step": 58440 }, { "epoch": 0.63, "learning_rate": 0.00020521826555101508, "loss": 0.0173, "step": 58450 }, { "epoch": 0.63, "learning_rate": 0.0002052020496854122, "loss": 0.0154, "step": 58460 }, { "epoch": 0.63, "learning_rate": 0.0002051858338198093, "loss": 0.0169, "step": 58470 }, { "epoch": 0.63, "learning_rate": 0.00020516961795420636, "loss": 0.0177, "step": 58480 }, { "epoch": 0.63, "learning_rate": 0.00020515340208860348, "loss": 0.0153, "step": 58490 }, { "epoch": 0.63, "learning_rate": 0.00020513718622300057, "loss": 0.0166, "step": 58500 }, { "epoch": 0.63, "learning_rate": 0.00020512097035739767, "loss": 0.0187, "step": 58510 }, { "epoch": 0.63, "learning_rate": 0.00020510475449179473, "loss": 0.0204, "step": 58520 }, { "epoch": 0.63, "learning_rate": 0.00020508853862619185, "loss": 0.0143, "step": 58530 }, { "epoch": 0.63, "learning_rate": 0.00020507232276058894, "loss": 0.0207, "step": 58540 }, { "epoch": 0.63, "learning_rate": 0.00020505610689498604, "loss": 0.0149, "step": 58550 }, { "epoch": 0.63, "learning_rate": 0.00020503989102938313, "loss": 0.018, "step": 58560 }, { "epoch": 0.63, "learning_rate": 0.00020502367516378022, "loss": 0.0206, "step": 58570 }, { "epoch": 0.63, "learning_rate": 0.00020500745929817732, "loss": 0.0157, "step": 58580 }, { "epoch": 0.63, "learning_rate": 0.00020499124343257443, "loss": 0.0186, "step": 58590 }, { "epoch": 0.63, "learning_rate": 0.0002049750275669715, "loss": 0.0125, "step": 58600 }, { "epoch": 0.63, "learning_rate": 0.0002049588117013686, "loss": 0.0206, "step": 58610 }, { "epoch": 0.63, "learning_rate": 0.00020494259583576569, "loss": 0.0199, "step": 58620 }, { "epoch": 0.63, "learning_rate": 0.0002049263799701628, "loss": 0.0178, "step": 58630 }, { "epoch": 0.63, "learning_rate": 0.00020491016410455987, "loss": 0.0179, "step": 58640 }, { "epoch": 0.63, "learning_rate": 0.00020489394823895696, "loss": 0.0164, "step": 58650 }, { "epoch": 0.63, "learning_rate": 0.00020487773237335408, "loss": 0.0162, "step": 58660 }, { "epoch": 0.63, "learning_rate": 0.00020486151650775118, "loss": 0.014, "step": 58670 }, { "epoch": 0.63, "learning_rate": 0.00020484530064214824, "loss": 0.0197, "step": 58680 }, { "epoch": 0.63, "learning_rate": 0.00020482908477654536, "loss": 0.0146, "step": 58690 }, { "epoch": 0.63, "learning_rate": 0.00020481286891094246, "loss": 0.0142, "step": 58700 }, { "epoch": 0.63, "learning_rate": 0.00020479665304533955, "loss": 0.0161, "step": 58710 }, { "epoch": 0.63, "learning_rate": 0.0002047804371797366, "loss": 0.0182, "step": 58720 }, { "epoch": 0.63, "learning_rate": 0.00020476422131413373, "loss": 0.0181, "step": 58730 }, { "epoch": 0.64, "learning_rate": 0.00020474800544853083, "loss": 0.0198, "step": 58740 }, { "epoch": 0.64, "learning_rate": 0.00020473178958292792, "loss": 0.0167, "step": 58750 }, { "epoch": 0.64, "learning_rate": 0.000204715573717325, "loss": 0.0169, "step": 58760 }, { "epoch": 0.64, "learning_rate": 0.0002046993578517221, "loss": 0.0183, "step": 58770 }, { "epoch": 0.64, "learning_rate": 0.0002046831419861192, "loss": 0.0158, "step": 58780 }, { "epoch": 0.64, "learning_rate": 0.00020466692612051632, "loss": 0.019, "step": 58790 }, { "epoch": 0.64, "learning_rate": 0.00020465071025491338, "loss": 0.017, "step": 58800 }, { "epoch": 0.64, "learning_rate": 0.00020463449438931048, "loss": 0.0175, "step": 58810 }, { "epoch": 0.64, "learning_rate": 0.00020461827852370757, "loss": 0.0204, "step": 58820 }, { "epoch": 0.64, "learning_rate": 0.0002046020626581047, "loss": 0.0181, "step": 58830 }, { "epoch": 0.64, "learning_rate": 0.00020458584679250175, "loss": 0.0139, "step": 58840 }, { "epoch": 0.64, "learning_rate": 0.00020456963092689885, "loss": 0.0165, "step": 58850 }, { "epoch": 0.64, "learning_rate": 0.00020455341506129597, "loss": 0.0171, "step": 58860 }, { "epoch": 0.64, "learning_rate": 0.00020453719919569306, "loss": 0.0161, "step": 58870 }, { "epoch": 0.64, "learning_rate": 0.00020452098333009012, "loss": 0.015, "step": 58880 }, { "epoch": 0.64, "learning_rate": 0.00020450476746448722, "loss": 0.0136, "step": 58890 }, { "epoch": 0.64, "learning_rate": 0.00020448855159888434, "loss": 0.0177, "step": 58900 }, { "epoch": 0.64, "learning_rate": 0.00020447233573328143, "loss": 0.0127, "step": 58910 }, { "epoch": 0.64, "learning_rate": 0.0002044561198676785, "loss": 0.0159, "step": 58920 }, { "epoch": 0.64, "learning_rate": 0.00020443990400207562, "loss": 0.0184, "step": 58930 }, { "epoch": 0.64, "learning_rate": 0.0002044236881364727, "loss": 0.0163, "step": 58940 }, { "epoch": 0.64, "learning_rate": 0.0002044074722708698, "loss": 0.0153, "step": 58950 }, { "epoch": 0.64, "learning_rate": 0.00020439125640526687, "loss": 0.0152, "step": 58960 }, { "epoch": 0.64, "learning_rate": 0.00020437504053966399, "loss": 0.0188, "step": 58970 }, { "epoch": 0.64, "learning_rate": 0.00020435882467406108, "loss": 0.0165, "step": 58980 }, { "epoch": 0.64, "learning_rate": 0.0002043426088084582, "loss": 0.018, "step": 58990 }, { "epoch": 0.64, "learning_rate": 0.0002043263929428553, "loss": 0.0178, "step": 59000 }, { "epoch": 0.64, "eval_cer": 0.9215251973031615, "eval_loss": 0.011170790530741215, "eval_runtime": 121.4022, "eval_samples_per_second": 16.474, "eval_steps_per_second": 4.119, "step": 59000 }, { "epoch": 0.64, "learning_rate": 0.00020431017707725236, "loss": 0.0191, "step": 59010 }, { "epoch": 0.64, "learning_rate": 0.00020429396121164945, "loss": 0.0162, "step": 59020 }, { "epoch": 0.64, "learning_rate": 0.00020427774534604657, "loss": 0.0155, "step": 59030 }, { "epoch": 0.64, "learning_rate": 0.00020426152948044366, "loss": 0.016, "step": 59040 }, { "epoch": 0.64, "learning_rate": 0.00020424531361484073, "loss": 0.0152, "step": 59050 }, { "epoch": 0.64, "learning_rate": 0.00020422909774923785, "loss": 0.0133, "step": 59060 }, { "epoch": 0.64, "learning_rate": 0.00020421288188363494, "loss": 0.0162, "step": 59070 }, { "epoch": 0.64, "learning_rate": 0.00020419666601803203, "loss": 0.0147, "step": 59080 }, { "epoch": 0.64, "learning_rate": 0.0002041804501524291, "loss": 0.0173, "step": 59090 }, { "epoch": 0.64, "learning_rate": 0.00020416423428682622, "loss": 0.0154, "step": 59100 }, { "epoch": 0.64, "learning_rate": 0.0002041480184212233, "loss": 0.0186, "step": 59110 }, { "epoch": 0.64, "learning_rate": 0.0002041318025556204, "loss": 0.015, "step": 59120 }, { "epoch": 0.64, "learning_rate": 0.0002041155866900175, "loss": 0.0161, "step": 59130 }, { "epoch": 0.64, "learning_rate": 0.0002040993708244146, "loss": 0.0185, "step": 59140 }, { "epoch": 0.64, "learning_rate": 0.00020408315495881168, "loss": 0.0159, "step": 59150 }, { "epoch": 0.64, "learning_rate": 0.0002040669390932088, "loss": 0.0169, "step": 59160 }, { "epoch": 0.64, "learning_rate": 0.00020405072322760587, "loss": 0.0147, "step": 59170 }, { "epoch": 0.64, "learning_rate": 0.00020403450736200296, "loss": 0.0162, "step": 59180 }, { "epoch": 0.64, "learning_rate": 0.00020401829149640005, "loss": 0.015, "step": 59190 }, { "epoch": 0.64, "learning_rate": 0.00020400207563079717, "loss": 0.019, "step": 59200 }, { "epoch": 0.64, "learning_rate": 0.00020398585976519424, "loss": 0.0177, "step": 59210 }, { "epoch": 0.64, "learning_rate": 0.00020396964389959133, "loss": 0.0147, "step": 59220 }, { "epoch": 0.64, "learning_rate": 0.00020395342803398845, "loss": 0.0172, "step": 59230 }, { "epoch": 0.64, "learning_rate": 0.00020393721216838554, "loss": 0.0194, "step": 59240 }, { "epoch": 0.64, "learning_rate": 0.0002039209963027826, "loss": 0.0152, "step": 59250 }, { "epoch": 0.64, "learning_rate": 0.0002039047804371797, "loss": 0.0149, "step": 59260 }, { "epoch": 0.64, "learning_rate": 0.00020388856457157682, "loss": 0.0146, "step": 59270 }, { "epoch": 0.64, "learning_rate": 0.00020387234870597392, "loss": 0.0141, "step": 59280 }, { "epoch": 0.64, "learning_rate": 0.00020385613284037098, "loss": 0.0174, "step": 59290 }, { "epoch": 0.64, "learning_rate": 0.0002038399169747681, "loss": 0.0147, "step": 59300 }, { "epoch": 0.64, "learning_rate": 0.0002038237011091652, "loss": 0.0182, "step": 59310 }, { "epoch": 0.64, "learning_rate": 0.0002038074852435623, "loss": 0.0186, "step": 59320 }, { "epoch": 0.64, "learning_rate": 0.00020379126937795935, "loss": 0.0163, "step": 59330 }, { "epoch": 0.64, "learning_rate": 0.00020377505351235647, "loss": 0.0157, "step": 59340 }, { "epoch": 0.64, "learning_rate": 0.00020375883764675356, "loss": 0.0156, "step": 59350 }, { "epoch": 0.64, "learning_rate": 0.00020374262178115068, "loss": 0.0131, "step": 59360 }, { "epoch": 0.64, "learning_rate": 0.00020372640591554775, "loss": 0.0169, "step": 59370 }, { "epoch": 0.64, "learning_rate": 0.00020371019004994484, "loss": 0.0181, "step": 59380 }, { "epoch": 0.64, "learning_rate": 0.00020369397418434194, "loss": 0.0313, "step": 59390 }, { "epoch": 0.64, "learning_rate": 0.00020367775831873906, "loss": 0.0281, "step": 59400 }, { "epoch": 0.64, "learning_rate": 0.00020366154245313612, "loss": 0.0155, "step": 59410 }, { "epoch": 0.64, "learning_rate": 0.00020364532658753321, "loss": 0.0154, "step": 59420 }, { "epoch": 0.64, "learning_rate": 0.00020362911072193033, "loss": 0.0147, "step": 59430 }, { "epoch": 0.64, "learning_rate": 0.00020361289485632743, "loss": 0.0164, "step": 59440 }, { "epoch": 0.64, "learning_rate": 0.0002035966789907245, "loss": 0.0145, "step": 59450 }, { "epoch": 0.64, "learning_rate": 0.00020358046312512158, "loss": 0.0197, "step": 59460 }, { "epoch": 0.64, "learning_rate": 0.0002035642472595187, "loss": 0.0164, "step": 59470 }, { "epoch": 0.64, "learning_rate": 0.0002035480313939158, "loss": 0.0159, "step": 59480 }, { "epoch": 0.64, "learning_rate": 0.00020353181552831286, "loss": 0.0182, "step": 59490 }, { "epoch": 0.64, "learning_rate": 0.00020351559966270998, "loss": 0.0197, "step": 59500 }, { "epoch": 0.64, "learning_rate": 0.00020349938379710708, "loss": 0.017, "step": 59510 }, { "epoch": 0.64, "learning_rate": 0.00020348316793150417, "loss": 0.0165, "step": 59520 }, { "epoch": 0.64, "learning_rate": 0.00020346695206590123, "loss": 0.0179, "step": 59530 }, { "epoch": 0.64, "learning_rate": 0.00020345073620029835, "loss": 0.0136, "step": 59540 }, { "epoch": 0.64, "learning_rate": 0.00020343452033469545, "loss": 0.017, "step": 59550 }, { "epoch": 0.64, "learning_rate": 0.00020341830446909254, "loss": 0.0172, "step": 59560 }, { "epoch": 0.64, "learning_rate": 0.00020340208860348963, "loss": 0.0152, "step": 59570 }, { "epoch": 0.64, "learning_rate": 0.00020338587273788672, "loss": 0.0148, "step": 59580 }, { "epoch": 0.64, "learning_rate": 0.00020336965687228382, "loss": 0.0176, "step": 59590 }, { "epoch": 0.64, "learning_rate": 0.00020335344100668094, "loss": 0.0169, "step": 59600 }, { "epoch": 0.64, "learning_rate": 0.000203337225141078, "loss": 0.0179, "step": 59610 }, { "epoch": 0.64, "learning_rate": 0.0002033210092754751, "loss": 0.012, "step": 59620 }, { "epoch": 0.64, "learning_rate": 0.0002033047934098722, "loss": 0.0161, "step": 59630 }, { "epoch": 0.64, "learning_rate": 0.0002032885775442693, "loss": 0.0165, "step": 59640 }, { "epoch": 0.64, "learning_rate": 0.00020327236167866637, "loss": 0.0212, "step": 59650 }, { "epoch": 0.64, "learning_rate": 0.00020325614581306347, "loss": 0.0132, "step": 59660 }, { "epoch": 0.65, "learning_rate": 0.0002032399299474606, "loss": 0.0148, "step": 59670 }, { "epoch": 0.65, "learning_rate": 0.00020322371408185768, "loss": 0.0179, "step": 59680 }, { "epoch": 0.65, "learning_rate": 0.00020320749821625475, "loss": 0.0143, "step": 59690 }, { "epoch": 0.65, "learning_rate": 0.00020319128235065186, "loss": 0.0136, "step": 59700 }, { "epoch": 0.65, "learning_rate": 0.00020317506648504896, "loss": 0.0162, "step": 59710 }, { "epoch": 0.65, "learning_rate": 0.00020315885061944605, "loss": 0.0148, "step": 59720 }, { "epoch": 0.65, "learning_rate": 0.00020314263475384317, "loss": 0.0161, "step": 59730 }, { "epoch": 0.65, "learning_rate": 0.00020312641888824024, "loss": 0.0138, "step": 59740 }, { "epoch": 0.65, "learning_rate": 0.00020311020302263733, "loss": 0.0162, "step": 59750 }, { "epoch": 0.65, "learning_rate": 0.00020309398715703442, "loss": 0.0164, "step": 59760 }, { "epoch": 0.65, "learning_rate": 0.00020307777129143154, "loss": 0.0163, "step": 59770 }, { "epoch": 0.65, "learning_rate": 0.0002030615554258286, "loss": 0.015, "step": 59780 }, { "epoch": 0.65, "learning_rate": 0.0002030453395602257, "loss": 0.0174, "step": 59790 }, { "epoch": 0.65, "learning_rate": 0.00020302912369462282, "loss": 0.0153, "step": 59800 }, { "epoch": 0.65, "learning_rate": 0.0002030129078290199, "loss": 0.0181, "step": 59810 }, { "epoch": 0.65, "learning_rate": 0.00020299669196341698, "loss": 0.0139, "step": 59820 }, { "epoch": 0.65, "learning_rate": 0.00020298047609781407, "loss": 0.015, "step": 59830 }, { "epoch": 0.65, "learning_rate": 0.0002029642602322112, "loss": 0.0142, "step": 59840 }, { "epoch": 0.65, "learning_rate": 0.00020294804436660828, "loss": 0.0172, "step": 59850 }, { "epoch": 0.65, "learning_rate": 0.00020293182850100535, "loss": 0.0166, "step": 59860 }, { "epoch": 0.65, "learning_rate": 0.00020291561263540247, "loss": 0.0185, "step": 59870 }, { "epoch": 0.65, "learning_rate": 0.00020289939676979956, "loss": 0.0172, "step": 59880 }, { "epoch": 0.65, "learning_rate": 0.00020288318090419665, "loss": 0.0191, "step": 59890 }, { "epoch": 0.65, "learning_rate": 0.00020286696503859372, "loss": 0.0179, "step": 59900 }, { "epoch": 0.65, "learning_rate": 0.00020285074917299084, "loss": 0.0148, "step": 59910 }, { "epoch": 0.65, "learning_rate": 0.00020283453330738793, "loss": 0.0133, "step": 59920 }, { "epoch": 0.65, "learning_rate": 0.00020281831744178505, "loss": 0.0153, "step": 59930 }, { "epoch": 0.65, "learning_rate": 0.00020280210157618212, "loss": 0.016, "step": 59940 }, { "epoch": 0.65, "learning_rate": 0.0002027858857105792, "loss": 0.0147, "step": 59950 }, { "epoch": 0.65, "learning_rate": 0.0002027696698449763, "loss": 0.0164, "step": 59960 }, { "epoch": 0.65, "learning_rate": 0.00020275345397937342, "loss": 0.0176, "step": 59970 }, { "epoch": 0.65, "learning_rate": 0.0002027372381137705, "loss": 0.0186, "step": 59980 }, { "epoch": 0.65, "learning_rate": 0.00020272102224816758, "loss": 0.0129, "step": 59990 }, { "epoch": 0.65, "learning_rate": 0.0002027048063825647, "loss": 0.0187, "step": 60000 }, { "epoch": 0.65, "eval_cer": 0.9215121682588159, "eval_loss": 0.01132188830524683, "eval_runtime": 121.508, "eval_samples_per_second": 16.46, "eval_steps_per_second": 4.115, "step": 60000 }, { "epoch": 0.65, "learning_rate": 0.0002026885905169618, "loss": 0.0149, "step": 60010 }, { "epoch": 0.65, "learning_rate": 0.00020267237465135886, "loss": 0.0151, "step": 60020 }, { "epoch": 0.65, "learning_rate": 0.00020265615878575595, "loss": 0.0162, "step": 60030 }, { "epoch": 0.65, "learning_rate": 0.00020263994292015307, "loss": 0.02, "step": 60040 }, { "epoch": 0.65, "learning_rate": 0.00020262372705455017, "loss": 0.0149, "step": 60050 }, { "epoch": 0.65, "learning_rate": 0.00020260751118894723, "loss": 0.0179, "step": 60060 }, { "epoch": 0.65, "learning_rate": 0.00020259129532334435, "loss": 0.0158, "step": 60070 }, { "epoch": 0.65, "learning_rate": 0.00020257507945774144, "loss": 0.0161, "step": 60080 }, { "epoch": 0.65, "learning_rate": 0.00020255886359213854, "loss": 0.0151, "step": 60090 }, { "epoch": 0.65, "learning_rate": 0.0002025426477265356, "loss": 0.0163, "step": 60100 }, { "epoch": 0.65, "learning_rate": 0.00020252643186093272, "loss": 0.0131, "step": 60110 }, { "epoch": 0.65, "learning_rate": 0.00020251021599532981, "loss": 0.0151, "step": 60120 }, { "epoch": 0.65, "learning_rate": 0.0002024940001297269, "loss": 0.0161, "step": 60130 }, { "epoch": 0.65, "learning_rate": 0.000202477784264124, "loss": 0.0159, "step": 60140 }, { "epoch": 0.65, "learning_rate": 0.0002024615683985211, "loss": 0.0139, "step": 60150 }, { "epoch": 0.65, "learning_rate": 0.00020244535253291819, "loss": 0.0156, "step": 60160 }, { "epoch": 0.65, "learning_rate": 0.0002024291366673153, "loss": 0.0183, "step": 60170 }, { "epoch": 0.65, "learning_rate": 0.00020241292080171237, "loss": 0.0179, "step": 60180 }, { "epoch": 0.65, "learning_rate": 0.00020239670493610946, "loss": 0.0133, "step": 60190 }, { "epoch": 0.65, "learning_rate": 0.00020238048907050656, "loss": 0.0172, "step": 60200 }, { "epoch": 0.65, "learning_rate": 0.00020236427320490368, "loss": 0.0171, "step": 60210 }, { "epoch": 0.65, "learning_rate": 0.00020234805733930074, "loss": 0.014, "step": 60220 }, { "epoch": 0.65, "learning_rate": 0.00020233184147369783, "loss": 0.0165, "step": 60230 }, { "epoch": 0.65, "learning_rate": 0.00020231562560809495, "loss": 0.0152, "step": 60240 }, { "epoch": 0.65, "learning_rate": 0.00020229940974249205, "loss": 0.016, "step": 60250 }, { "epoch": 0.65, "learning_rate": 0.0002022831938768891, "loss": 0.017, "step": 60260 }, { "epoch": 0.65, "learning_rate": 0.0002022669780112862, "loss": 0.0137, "step": 60270 }, { "epoch": 0.65, "learning_rate": 0.00020225076214568333, "loss": 0.0151, "step": 60280 }, { "epoch": 0.65, "learning_rate": 0.00020223454628008042, "loss": 0.0163, "step": 60290 }, { "epoch": 0.65, "learning_rate": 0.00020221833041447748, "loss": 0.0156, "step": 60300 }, { "epoch": 0.65, "learning_rate": 0.0002022021145488746, "loss": 0.0169, "step": 60310 }, { "epoch": 0.65, "learning_rate": 0.0002021858986832717, "loss": 0.0149, "step": 60320 }, { "epoch": 0.65, "learning_rate": 0.0002021696828176688, "loss": 0.0135, "step": 60330 }, { "epoch": 0.65, "learning_rate": 0.00020215346695206585, "loss": 0.0165, "step": 60340 }, { "epoch": 0.65, "learning_rate": 0.00020213725108646297, "loss": 0.0136, "step": 60350 }, { "epoch": 0.65, "learning_rate": 0.00020212103522086007, "loss": 0.0148, "step": 60360 }, { "epoch": 0.65, "learning_rate": 0.0002021048193552572, "loss": 0.0156, "step": 60370 }, { "epoch": 0.65, "learning_rate": 0.00020208860348965425, "loss": 0.019, "step": 60380 }, { "epoch": 0.65, "learning_rate": 0.00020207238762405135, "loss": 0.014, "step": 60390 }, { "epoch": 0.65, "learning_rate": 0.00020205617175844844, "loss": 0.0144, "step": 60400 }, { "epoch": 0.65, "learning_rate": 0.00020203995589284556, "loss": 0.0153, "step": 60410 }, { "epoch": 0.65, "learning_rate": 0.00020202374002724262, "loss": 0.0148, "step": 60420 }, { "epoch": 0.65, "learning_rate": 0.00020200752416163972, "loss": 0.0181, "step": 60430 }, { "epoch": 0.65, "learning_rate": 0.00020199130829603684, "loss": 0.0156, "step": 60440 }, { "epoch": 0.65, "learning_rate": 0.00020197509243043393, "loss": 0.0164, "step": 60450 }, { "epoch": 0.65, "learning_rate": 0.00020195887656483102, "loss": 0.0158, "step": 60460 }, { "epoch": 0.65, "learning_rate": 0.0002019426606992281, "loss": 0.0153, "step": 60470 }, { "epoch": 0.65, "learning_rate": 0.0002019264448336252, "loss": 0.0148, "step": 60480 }, { "epoch": 0.65, "learning_rate": 0.0002019102289680223, "loss": 0.0125, "step": 60490 }, { "epoch": 0.65, "learning_rate": 0.0002018940131024194, "loss": 0.016, "step": 60500 }, { "epoch": 0.65, "learning_rate": 0.00020187779723681649, "loss": 0.0138, "step": 60510 }, { "epoch": 0.65, "learning_rate": 0.00020186158137121358, "loss": 0.0159, "step": 60520 }, { "epoch": 0.65, "learning_rate": 0.00020184536550561067, "loss": 0.0164, "step": 60530 }, { "epoch": 0.65, "learning_rate": 0.0002018291496400078, "loss": 0.0168, "step": 60540 }, { "epoch": 0.65, "learning_rate": 0.00020181293377440486, "loss": 0.0202, "step": 60550 }, { "epoch": 0.65, "learning_rate": 0.00020179671790880195, "loss": 0.0151, "step": 60560 }, { "epoch": 0.65, "learning_rate": 0.00020178050204319904, "loss": 0.0166, "step": 60570 }, { "epoch": 0.65, "learning_rate": 0.00020176428617759616, "loss": 0.0163, "step": 60580 }, { "epoch": 0.66, "learning_rate": 0.00020174807031199323, "loss": 0.0164, "step": 60590 }, { "epoch": 0.66, "learning_rate": 0.00020173185444639032, "loss": 0.0152, "step": 60600 }, { "epoch": 0.66, "learning_rate": 0.00020171563858078744, "loss": 0.0167, "step": 60610 }, { "epoch": 0.66, "learning_rate": 0.00020169942271518453, "loss": 0.0155, "step": 60620 }, { "epoch": 0.66, "learning_rate": 0.0002016832068495816, "loss": 0.0175, "step": 60630 }, { "epoch": 0.66, "learning_rate": 0.0002016669909839787, "loss": 0.0185, "step": 60640 }, { "epoch": 0.66, "learning_rate": 0.0002016507751183758, "loss": 0.0147, "step": 60650 }, { "epoch": 0.66, "learning_rate": 0.0002016345592527729, "loss": 0.021, "step": 60660 }, { "epoch": 0.66, "learning_rate": 0.00020161834338716997, "loss": 0.0219, "step": 60670 }, { "epoch": 0.66, "learning_rate": 0.0002016021275215671, "loss": 0.0143, "step": 60680 }, { "epoch": 0.66, "learning_rate": 0.00020158591165596418, "loss": 0.0161, "step": 60690 }, { "epoch": 0.66, "learning_rate": 0.00020156969579036127, "loss": 0.0173, "step": 60700 }, { "epoch": 0.66, "learning_rate": 0.00020155347992475837, "loss": 0.0171, "step": 60710 }, { "epoch": 0.66, "learning_rate": 0.00020153726405915546, "loss": 0.0175, "step": 60720 }, { "epoch": 0.66, "learning_rate": 0.00020152104819355255, "loss": 0.015, "step": 60730 }, { "epoch": 0.66, "learning_rate": 0.00020150483232794967, "loss": 0.0174, "step": 60740 }, { "epoch": 0.66, "learning_rate": 0.00020148861646234674, "loss": 0.0163, "step": 60750 }, { "epoch": 0.66, "learning_rate": 0.00020147240059674383, "loss": 0.0154, "step": 60760 }, { "epoch": 0.66, "learning_rate": 0.00020145618473114092, "loss": 0.0198, "step": 60770 }, { "epoch": 0.66, "learning_rate": 0.00020143996886553804, "loss": 0.0174, "step": 60780 }, { "epoch": 0.66, "learning_rate": 0.0002014237529999351, "loss": 0.0156, "step": 60790 }, { "epoch": 0.66, "learning_rate": 0.0002014075371343322, "loss": 0.0165, "step": 60800 }, { "epoch": 0.66, "learning_rate": 0.00020139132126872932, "loss": 0.0144, "step": 60810 }, { "epoch": 0.66, "learning_rate": 0.00020137510540312641, "loss": 0.0177, "step": 60820 }, { "epoch": 0.66, "learning_rate": 0.00020135888953752348, "loss": 0.014, "step": 60830 }, { "epoch": 0.66, "learning_rate": 0.00020134267367192057, "loss": 0.0158, "step": 60840 }, { "epoch": 0.66, "learning_rate": 0.0002013264578063177, "loss": 0.0146, "step": 60850 }, { "epoch": 0.66, "learning_rate": 0.00020131024194071479, "loss": 0.0173, "step": 60860 }, { "epoch": 0.66, "learning_rate": 0.00020129402607511185, "loss": 0.0155, "step": 60870 }, { "epoch": 0.66, "learning_rate": 0.00020127781020950897, "loss": 0.0189, "step": 60880 }, { "epoch": 0.66, "learning_rate": 0.00020126159434390606, "loss": 0.019, "step": 60890 }, { "epoch": 0.66, "learning_rate": 0.00020124537847830316, "loss": 0.0156, "step": 60900 }, { "epoch": 0.66, "learning_rate": 0.00020122916261270022, "loss": 0.015, "step": 60910 }, { "epoch": 0.66, "learning_rate": 0.00020121294674709734, "loss": 0.0185, "step": 60920 }, { "epoch": 0.66, "learning_rate": 0.00020119673088149444, "loss": 0.0186, "step": 60930 }, { "epoch": 0.66, "learning_rate": 0.00020118051501589155, "loss": 0.017, "step": 60940 }, { "epoch": 0.66, "learning_rate": 0.00020116429915028862, "loss": 0.0219, "step": 60950 }, { "epoch": 0.66, "learning_rate": 0.0002011480832846857, "loss": 0.0143, "step": 60960 }, { "epoch": 0.66, "learning_rate": 0.0002011318674190828, "loss": 0.0164, "step": 60970 }, { "epoch": 0.66, "learning_rate": 0.00020111565155347993, "loss": 0.016, "step": 60980 }, { "epoch": 0.66, "learning_rate": 0.000201099435687877, "loss": 0.0177, "step": 60990 }, { "epoch": 0.66, "learning_rate": 0.00020108321982227408, "loss": 0.0174, "step": 61000 }, { "epoch": 0.66, "eval_cer": 0.9215981599514972, "eval_loss": 0.011921165511012077, "eval_runtime": 121.5349, "eval_samples_per_second": 16.456, "eval_steps_per_second": 4.114, "step": 61000 }, { "epoch": 0.66, "learning_rate": 0.0002010670039566712, "loss": 0.0148, "step": 61010 }, { "epoch": 0.66, "learning_rate": 0.0002010507880910683, "loss": 0.0161, "step": 61020 }, { "epoch": 0.66, "learning_rate": 0.00020103457222546536, "loss": 0.0206, "step": 61030 }, { "epoch": 0.66, "learning_rate": 0.00020101835635986246, "loss": 0.0157, "step": 61040 }, { "epoch": 0.66, "learning_rate": 0.00020100214049425958, "loss": 0.0165, "step": 61050 }, { "epoch": 0.66, "learning_rate": 0.00020098592462865667, "loss": 0.014, "step": 61060 }, { "epoch": 0.66, "learning_rate": 0.00020096970876305373, "loss": 0.0158, "step": 61070 }, { "epoch": 0.66, "learning_rate": 0.00020095349289745085, "loss": 0.0135, "step": 61080 }, { "epoch": 0.66, "learning_rate": 0.00020093727703184795, "loss": 0.0166, "step": 61090 }, { "epoch": 0.66, "learning_rate": 0.00020092106116624504, "loss": 0.0236, "step": 61100 }, { "epoch": 0.66, "learning_rate": 0.0002009048453006421, "loss": 0.0185, "step": 61110 }, { "epoch": 0.66, "learning_rate": 0.00020088862943503922, "loss": 0.013, "step": 61120 }, { "epoch": 0.66, "learning_rate": 0.00020087241356943632, "loss": 0.0163, "step": 61130 }, { "epoch": 0.66, "learning_rate": 0.0002008561977038334, "loss": 0.0171, "step": 61140 }, { "epoch": 0.66, "learning_rate": 0.00020083998183823053, "loss": 0.0207, "step": 61150 }, { "epoch": 0.66, "learning_rate": 0.0002008237659726276, "loss": 0.0166, "step": 61160 }, { "epoch": 0.66, "learning_rate": 0.0002008075501070247, "loss": 0.0156, "step": 61170 }, { "epoch": 0.66, "learning_rate": 0.0002007913342414218, "loss": 0.0174, "step": 61180 }, { "epoch": 0.66, "learning_rate": 0.0002007751183758189, "loss": 0.0159, "step": 61190 }, { "epoch": 0.66, "learning_rate": 0.00020075890251021597, "loss": 0.015, "step": 61200 }, { "epoch": 0.66, "learning_rate": 0.00020074268664461306, "loss": 0.0173, "step": 61210 }, { "epoch": 0.66, "learning_rate": 0.00020072647077901018, "loss": 0.0185, "step": 61220 }, { "epoch": 0.66, "learning_rate": 0.00020071025491340727, "loss": 0.017, "step": 61230 }, { "epoch": 0.66, "learning_rate": 0.00020069403904780434, "loss": 0.0169, "step": 61240 }, { "epoch": 0.66, "learning_rate": 0.00020067782318220146, "loss": 0.0177, "step": 61250 }, { "epoch": 0.66, "learning_rate": 0.00020066160731659855, "loss": 0.0166, "step": 61260 }, { "epoch": 0.66, "learning_rate": 0.00020064539145099564, "loss": 0.0177, "step": 61270 }, { "epoch": 0.66, "learning_rate": 0.0002006291755853927, "loss": 0.0165, "step": 61280 }, { "epoch": 0.66, "learning_rate": 0.00020061295971978983, "loss": 0.0156, "step": 61290 }, { "epoch": 0.66, "learning_rate": 0.00020059674385418692, "loss": 0.0159, "step": 61300 }, { "epoch": 0.66, "learning_rate": 0.00020058052798858404, "loss": 0.0155, "step": 61310 }, { "epoch": 0.66, "learning_rate": 0.0002005643121229811, "loss": 0.0166, "step": 61320 }, { "epoch": 0.66, "learning_rate": 0.0002005480962573782, "loss": 0.0168, "step": 61330 }, { "epoch": 0.66, "learning_rate": 0.0002005318803917753, "loss": 0.0172, "step": 61340 }, { "epoch": 0.66, "learning_rate": 0.0002005156645261724, "loss": 0.016, "step": 61350 }, { "epoch": 0.66, "learning_rate": 0.00020049944866056948, "loss": 0.0153, "step": 61360 }, { "epoch": 0.66, "learning_rate": 0.00020048323279496657, "loss": 0.0178, "step": 61370 }, { "epoch": 0.66, "learning_rate": 0.0002004670169293637, "loss": 0.0151, "step": 61380 }, { "epoch": 0.66, "learning_rate": 0.00020045080106376078, "loss": 0.0186, "step": 61390 }, { "epoch": 0.66, "learning_rate": 0.00020043458519815785, "loss": 0.0211, "step": 61400 }, { "epoch": 0.66, "learning_rate": 0.00020041836933255494, "loss": 0.0134, "step": 61410 }, { "epoch": 0.66, "learning_rate": 0.00020040215346695206, "loss": 0.0131, "step": 61420 }, { "epoch": 0.66, "learning_rate": 0.00020038593760134915, "loss": 0.0142, "step": 61430 }, { "epoch": 0.66, "learning_rate": 0.00020036972173574622, "loss": 0.0177, "step": 61440 }, { "epoch": 0.66, "learning_rate": 0.00020035350587014334, "loss": 0.016, "step": 61450 }, { "epoch": 0.66, "learning_rate": 0.00020033729000454043, "loss": 0.0143, "step": 61460 }, { "epoch": 0.66, "learning_rate": 0.00020032107413893752, "loss": 0.0144, "step": 61470 }, { "epoch": 0.66, "learning_rate": 0.0002003048582733346, "loss": 0.0172, "step": 61480 }, { "epoch": 0.66, "learning_rate": 0.0002002886424077317, "loss": 0.0162, "step": 61490 }, { "epoch": 0.66, "learning_rate": 0.0002002724265421288, "loss": 0.0138, "step": 61500 }, { "epoch": 0.66, "learning_rate": 0.0002002562106765259, "loss": 0.0173, "step": 61510 }, { "epoch": 0.67, "learning_rate": 0.000200239994810923, "loss": 0.016, "step": 61520 }, { "epoch": 0.67, "learning_rate": 0.00020022377894532008, "loss": 0.0146, "step": 61530 }, { "epoch": 0.67, "learning_rate": 0.00020020756307971717, "loss": 0.0162, "step": 61540 }, { "epoch": 0.67, "learning_rate": 0.0002001913472141143, "loss": 0.0158, "step": 61550 }, { "epoch": 0.67, "learning_rate": 0.00020017513134851136, "loss": 0.0162, "step": 61560 }, { "epoch": 0.67, "learning_rate": 0.00020015891548290845, "loss": 0.0227, "step": 61570 }, { "epoch": 0.67, "learning_rate": 0.00020014269961730554, "loss": 0.0152, "step": 61580 }, { "epoch": 0.67, "learning_rate": 0.00020012648375170266, "loss": 0.0166, "step": 61590 }, { "epoch": 0.67, "learning_rate": 0.00020011026788609973, "loss": 0.015, "step": 61600 }, { "epoch": 0.67, "learning_rate": 0.00020009405202049682, "loss": 0.0146, "step": 61610 }, { "epoch": 0.67, "learning_rate": 0.00020007783615489394, "loss": 0.0159, "step": 61620 }, { "epoch": 0.67, "learning_rate": 0.00020006162028929104, "loss": 0.0206, "step": 61630 }, { "epoch": 0.67, "learning_rate": 0.0002000454044236881, "loss": 0.0178, "step": 61640 }, { "epoch": 0.67, "learning_rate": 0.0002000291885580852, "loss": 0.0178, "step": 61650 }, { "epoch": 0.67, "learning_rate": 0.00020001297269248231, "loss": 0.0202, "step": 61660 }, { "epoch": 0.67, "learning_rate": 0.0001999967568268794, "loss": 0.0178, "step": 61670 }, { "epoch": 0.67, "learning_rate": 0.00019998054096127647, "loss": 0.0149, "step": 61680 }, { "epoch": 0.67, "learning_rate": 0.0001999643250956736, "loss": 0.0155, "step": 61690 }, { "epoch": 0.67, "learning_rate": 0.00019994810923007068, "loss": 0.0187, "step": 61700 }, { "epoch": 0.67, "learning_rate": 0.00019993189336446778, "loss": 0.0189, "step": 61710 }, { "epoch": 0.67, "learning_rate": 0.00019991567749886487, "loss": 0.018, "step": 61720 }, { "epoch": 0.67, "learning_rate": 0.00019989946163326196, "loss": 0.0151, "step": 61730 }, { "epoch": 0.67, "learning_rate": 0.00019988324576765906, "loss": 0.0145, "step": 61740 }, { "epoch": 0.67, "learning_rate": 0.00019986702990205618, "loss": 0.0183, "step": 61750 }, { "epoch": 0.67, "learning_rate": 0.00019985081403645324, "loss": 0.0186, "step": 61760 }, { "epoch": 0.67, "learning_rate": 0.00019983459817085033, "loss": 0.0194, "step": 61770 }, { "epoch": 0.67, "learning_rate": 0.00019981838230524743, "loss": 0.0134, "step": 61780 }, { "epoch": 0.67, "learning_rate": 0.00019980216643964455, "loss": 0.016, "step": 61790 }, { "epoch": 0.67, "learning_rate": 0.0001997859505740416, "loss": 0.0146, "step": 61800 }, { "epoch": 0.67, "learning_rate": 0.0001997697347084387, "loss": 0.0166, "step": 61810 }, { "epoch": 0.67, "learning_rate": 0.00019975351884283582, "loss": 0.0149, "step": 61820 }, { "epoch": 0.67, "learning_rate": 0.00019973730297723292, "loss": 0.0149, "step": 61830 }, { "epoch": 0.67, "learning_rate": 0.00019972108711162998, "loss": 0.0146, "step": 61840 }, { "epoch": 0.67, "learning_rate": 0.00019970487124602708, "loss": 0.0161, "step": 61850 }, { "epoch": 0.67, "learning_rate": 0.0001996886553804242, "loss": 0.0162, "step": 61860 }, { "epoch": 0.67, "learning_rate": 0.0001996724395148213, "loss": 0.0176, "step": 61870 }, { "epoch": 0.67, "learning_rate": 0.00019965622364921838, "loss": 0.0153, "step": 61880 }, { "epoch": 0.67, "learning_rate": 0.00019964000778361547, "loss": 0.0192, "step": 61890 }, { "epoch": 0.67, "learning_rate": 0.00019962379191801257, "loss": 0.0172, "step": 61900 }, { "epoch": 0.67, "learning_rate": 0.00019960757605240966, "loss": 0.0192, "step": 61910 }, { "epoch": 0.67, "learning_rate": 0.00019959136018680678, "loss": 0.019, "step": 61920 }, { "epoch": 0.67, "learning_rate": 0.00019957514432120384, "loss": 0.0159, "step": 61930 }, { "epoch": 0.67, "learning_rate": 0.00019955892845560094, "loss": 0.016, "step": 61940 }, { "epoch": 0.67, "learning_rate": 0.00019954271258999803, "loss": 0.0149, "step": 61950 }, { "epoch": 0.67, "learning_rate": 0.00019952649672439515, "loss": 0.0162, "step": 61960 }, { "epoch": 0.67, "learning_rate": 0.00019951028085879222, "loss": 0.0183, "step": 61970 }, { "epoch": 0.67, "learning_rate": 0.0001994940649931893, "loss": 0.0186, "step": 61980 }, { "epoch": 0.67, "learning_rate": 0.00019947784912758643, "loss": 0.0201, "step": 61990 }, { "epoch": 0.67, "learning_rate": 0.00019946163326198352, "loss": 0.0135, "step": 62000 }, { "epoch": 0.67, "eval_cer": 0.9215330147297689, "eval_loss": 0.011450623162090778, "eval_runtime": 121.258, "eval_samples_per_second": 16.494, "eval_steps_per_second": 4.123, "step": 62000 }, { "epoch": 0.67, "learning_rate": 0.0001994454173963806, "loss": 0.0175, "step": 62010 }, { "epoch": 0.67, "learning_rate": 0.0001994292015307777, "loss": 0.0172, "step": 62020 }, { "epoch": 0.67, "learning_rate": 0.0001994129856651748, "loss": 0.0146, "step": 62030 }, { "epoch": 0.67, "learning_rate": 0.0001993967697995719, "loss": 0.0421, "step": 62040 }, { "epoch": 0.67, "learning_rate": 0.00019938055393396896, "loss": 0.0281, "step": 62050 }, { "epoch": 0.67, "learning_rate": 0.00019936433806836608, "loss": 0.0206, "step": 62060 }, { "epoch": 0.67, "learning_rate": 0.00019934812220276317, "loss": 0.0181, "step": 62070 }, { "epoch": 0.67, "learning_rate": 0.00019933190633716026, "loss": 0.0183, "step": 62080 }, { "epoch": 0.67, "learning_rate": 0.00019931569047155736, "loss": 0.0212, "step": 62090 }, { "epoch": 0.67, "learning_rate": 0.00019929947460595445, "loss": 0.0151, "step": 62100 }, { "epoch": 0.67, "learning_rate": 0.00019928325874035154, "loss": 0.0175, "step": 62110 }, { "epoch": 0.67, "learning_rate": 0.00019926704287474866, "loss": 0.0181, "step": 62120 }, { "epoch": 0.67, "learning_rate": 0.00019925082700914573, "loss": 0.0175, "step": 62130 }, { "epoch": 0.67, "learning_rate": 0.00019923461114354282, "loss": 0.0151, "step": 62140 }, { "epoch": 0.67, "learning_rate": 0.0001992183952779399, "loss": 0.0165, "step": 62150 }, { "epoch": 0.67, "learning_rate": 0.00019920217941233703, "loss": 0.018, "step": 62160 }, { "epoch": 0.67, "learning_rate": 0.0001991859635467341, "loss": 0.017, "step": 62170 }, { "epoch": 0.67, "learning_rate": 0.0001991697476811312, "loss": 0.0133, "step": 62180 }, { "epoch": 0.67, "learning_rate": 0.0001991535318155283, "loss": 0.0127, "step": 62190 }, { "epoch": 0.67, "learning_rate": 0.0001991373159499254, "loss": 0.0135, "step": 62200 }, { "epoch": 0.67, "learning_rate": 0.00019912110008432247, "loss": 0.0159, "step": 62210 }, { "epoch": 0.67, "learning_rate": 0.00019910488421871956, "loss": 0.0175, "step": 62220 }, { "epoch": 0.67, "learning_rate": 0.00019908866835311668, "loss": 0.0136, "step": 62230 }, { "epoch": 0.67, "learning_rate": 0.00019907245248751377, "loss": 0.0167, "step": 62240 }, { "epoch": 0.67, "learning_rate": 0.00019905623662191084, "loss": 0.0142, "step": 62250 }, { "epoch": 0.67, "learning_rate": 0.00019904002075630796, "loss": 0.0129, "step": 62260 }, { "epoch": 0.67, "learning_rate": 0.00019902380489070505, "loss": 0.0142, "step": 62270 }, { "epoch": 0.67, "learning_rate": 0.00019900758902510215, "loss": 0.0158, "step": 62280 }, { "epoch": 0.67, "learning_rate": 0.0001989913731594992, "loss": 0.0137, "step": 62290 }, { "epoch": 0.67, "learning_rate": 0.00019897515729389633, "loss": 0.0174, "step": 62300 }, { "epoch": 0.67, "learning_rate": 0.00019895894142829342, "loss": 0.0162, "step": 62310 }, { "epoch": 0.67, "learning_rate": 0.00019894272556269054, "loss": 0.0163, "step": 62320 }, { "epoch": 0.67, "learning_rate": 0.0001989265096970876, "loss": 0.0149, "step": 62330 }, { "epoch": 0.67, "learning_rate": 0.0001989102938314847, "loss": 0.0134, "step": 62340 }, { "epoch": 0.67, "learning_rate": 0.0001988940779658818, "loss": 0.0151, "step": 62350 }, { "epoch": 0.67, "learning_rate": 0.00019887786210027891, "loss": 0.0174, "step": 62360 }, { "epoch": 0.67, "learning_rate": 0.00019886164623467598, "loss": 0.0192, "step": 62370 }, { "epoch": 0.67, "learning_rate": 0.00019884543036907307, "loss": 0.0191, "step": 62380 }, { "epoch": 0.67, "learning_rate": 0.0001988292145034702, "loss": 0.0143, "step": 62390 }, { "epoch": 0.67, "learning_rate": 0.00019881299863786729, "loss": 0.017, "step": 62400 }, { "epoch": 0.67, "learning_rate": 0.00019879678277226435, "loss": 0.0168, "step": 62410 }, { "epoch": 0.67, "learning_rate": 0.00019878056690666144, "loss": 0.0161, "step": 62420 }, { "epoch": 0.67, "learning_rate": 0.00019876435104105856, "loss": 0.0133, "step": 62430 }, { "epoch": 0.68, "learning_rate": 0.00019874813517545566, "loss": 0.0163, "step": 62440 }, { "epoch": 0.68, "learning_rate": 0.00019873191930985272, "loss": 0.0174, "step": 62450 }, { "epoch": 0.68, "learning_rate": 0.00019871570344424984, "loss": 0.0156, "step": 62460 }, { "epoch": 0.68, "learning_rate": 0.00019869948757864693, "loss": 0.0161, "step": 62470 }, { "epoch": 0.68, "learning_rate": 0.00019868327171304403, "loss": 0.0143, "step": 62480 }, { "epoch": 0.68, "learning_rate": 0.0001986670558474411, "loss": 0.016, "step": 62490 }, { "epoch": 0.68, "learning_rate": 0.0001986508399818382, "loss": 0.0166, "step": 62500 }, { "epoch": 0.68, "learning_rate": 0.0001986346241162353, "loss": 0.0158, "step": 62510 }, { "epoch": 0.68, "learning_rate": 0.0001986184082506324, "loss": 0.0195, "step": 62520 }, { "epoch": 0.68, "learning_rate": 0.0001986021923850295, "loss": 0.0167, "step": 62530 }, { "epoch": 0.68, "learning_rate": 0.00019858597651942658, "loss": 0.0153, "step": 62540 }, { "epoch": 0.68, "learning_rate": 0.00019856976065382368, "loss": 0.0156, "step": 62550 }, { "epoch": 0.68, "learning_rate": 0.0001985535447882208, "loss": 0.0202, "step": 62560 }, { "epoch": 0.68, "learning_rate": 0.00019853732892261786, "loss": 0.0142, "step": 62570 }, { "epoch": 0.68, "learning_rate": 0.00019852111305701495, "loss": 0.0151, "step": 62580 }, { "epoch": 0.68, "learning_rate": 0.00019850489719141205, "loss": 0.0178, "step": 62590 }, { "epoch": 0.68, "learning_rate": 0.00019848868132580917, "loss": 0.0161, "step": 62600 }, { "epoch": 0.68, "learning_rate": 0.00019847246546020626, "loss": 0.0156, "step": 62610 }, { "epoch": 0.68, "learning_rate": 0.00019845624959460333, "loss": 0.017, "step": 62620 }, { "epoch": 0.68, "learning_rate": 0.00019844003372900045, "loss": 0.0155, "step": 62630 }, { "epoch": 0.68, "learning_rate": 0.00019842381786339754, "loss": 0.0149, "step": 62640 }, { "epoch": 0.68, "learning_rate": 0.00019840760199779463, "loss": 0.0175, "step": 62650 }, { "epoch": 0.68, "learning_rate": 0.0001983913861321917, "loss": 0.0135, "step": 62660 }, { "epoch": 0.68, "learning_rate": 0.00019837517026658882, "loss": 0.017, "step": 62670 }, { "epoch": 0.68, "learning_rate": 0.0001983589544009859, "loss": 0.0151, "step": 62680 }, { "epoch": 0.68, "learning_rate": 0.00019834273853538303, "loss": 0.0198, "step": 62690 }, { "epoch": 0.68, "learning_rate": 0.0001983265226697801, "loss": 0.0178, "step": 62700 }, { "epoch": 0.68, "learning_rate": 0.0001983103068041772, "loss": 0.0156, "step": 62710 }, { "epoch": 0.68, "learning_rate": 0.00019829409093857428, "loss": 0.0138, "step": 62720 }, { "epoch": 0.68, "learning_rate": 0.0001982778750729714, "loss": 0.0154, "step": 62730 }, { "epoch": 0.68, "learning_rate": 0.00019826165920736847, "loss": 0.0157, "step": 62740 }, { "epoch": 0.68, "learning_rate": 0.00019824544334176556, "loss": 0.0184, "step": 62750 }, { "epoch": 0.68, "learning_rate": 0.00019822922747616268, "loss": 0.0176, "step": 62760 }, { "epoch": 0.68, "learning_rate": 0.00019821301161055977, "loss": 0.0173, "step": 62770 }, { "epoch": 0.68, "learning_rate": 0.00019819679574495684, "loss": 0.0152, "step": 62780 }, { "epoch": 0.68, "learning_rate": 0.00019818057987935393, "loss": 0.0157, "step": 62790 }, { "epoch": 0.68, "learning_rate": 0.00019816436401375105, "loss": 0.0162, "step": 62800 }, { "epoch": 0.68, "learning_rate": 0.00019814814814814814, "loss": 0.0149, "step": 62810 }, { "epoch": 0.68, "learning_rate": 0.0001981319322825452, "loss": 0.0176, "step": 62820 }, { "epoch": 0.68, "learning_rate": 0.00019811571641694233, "loss": 0.0163, "step": 62830 }, { "epoch": 0.68, "learning_rate": 0.00019809950055133942, "loss": 0.0176, "step": 62840 }, { "epoch": 0.68, "learning_rate": 0.0001980832846857365, "loss": 0.0156, "step": 62850 }, { "epoch": 0.68, "learning_rate": 0.00019806706882013358, "loss": 0.0156, "step": 62860 }, { "epoch": 0.68, "learning_rate": 0.0001980508529545307, "loss": 0.0165, "step": 62870 }, { "epoch": 0.68, "learning_rate": 0.0001980346370889278, "loss": 0.0173, "step": 62880 }, { "epoch": 0.68, "learning_rate": 0.00019801842122332488, "loss": 0.0182, "step": 62890 }, { "epoch": 0.68, "learning_rate": 0.00019800220535772198, "loss": 0.0183, "step": 62900 }, { "epoch": 0.68, "learning_rate": 0.00019798598949211907, "loss": 0.0125, "step": 62910 }, { "epoch": 0.68, "learning_rate": 0.00019796977362651616, "loss": 0.0153, "step": 62920 }, { "epoch": 0.68, "learning_rate": 0.00019795355776091328, "loss": 0.0196, "step": 62930 }, { "epoch": 0.68, "learning_rate": 0.00019793734189531035, "loss": 0.0158, "step": 62940 }, { "epoch": 0.68, "learning_rate": 0.00019792112602970744, "loss": 0.0168, "step": 62950 }, { "epoch": 0.68, "learning_rate": 0.00019790491016410453, "loss": 0.0155, "step": 62960 }, { "epoch": 0.68, "learning_rate": 0.00019788869429850165, "loss": 0.0191, "step": 62970 }, { "epoch": 0.68, "learning_rate": 0.00019787247843289872, "loss": 0.0145, "step": 62980 }, { "epoch": 0.68, "learning_rate": 0.0001978562625672958, "loss": 0.0154, "step": 62990 }, { "epoch": 0.68, "learning_rate": 0.00019784004670169293, "loss": 0.0167, "step": 63000 }, { "epoch": 0.68, "eval_cer": 0.9215590728184603, "eval_loss": 0.011219864711165428, "eval_runtime": 121.1331, "eval_samples_per_second": 16.511, "eval_steps_per_second": 4.128, "step": 63000 }, { "epoch": 0.68, "learning_rate": 0.00019782383083609002, "loss": 0.0196, "step": 63010 }, { "epoch": 0.68, "learning_rate": 0.0001978076149704871, "loss": 0.0175, "step": 63020 }, { "epoch": 0.68, "learning_rate": 0.0001977913991048842, "loss": 0.0162, "step": 63030 }, { "epoch": 0.68, "learning_rate": 0.0001977751832392813, "loss": 0.015, "step": 63040 }, { "epoch": 0.68, "learning_rate": 0.0001977589673736784, "loss": 0.0159, "step": 63050 }, { "epoch": 0.68, "learning_rate": 0.00019774275150807546, "loss": 0.0173, "step": 63060 }, { "epoch": 0.68, "learning_rate": 0.00019772653564247258, "loss": 0.0158, "step": 63070 }, { "epoch": 0.68, "learning_rate": 0.00019771031977686967, "loss": 0.0167, "step": 63080 }, { "epoch": 0.68, "learning_rate": 0.00019769410391126677, "loss": 0.0153, "step": 63090 }, { "epoch": 0.68, "learning_rate": 0.00019767788804566386, "loss": 0.0155, "step": 63100 }, { "epoch": 0.68, "learning_rate": 0.00019766167218006095, "loss": 0.0157, "step": 63110 }, { "epoch": 0.68, "learning_rate": 0.00019764545631445804, "loss": 0.0147, "step": 63120 }, { "epoch": 0.68, "learning_rate": 0.00019762924044885516, "loss": 0.0236, "step": 63130 }, { "epoch": 0.68, "learning_rate": 0.00019761302458325223, "loss": 0.0183, "step": 63140 }, { "epoch": 0.68, "learning_rate": 0.00019759680871764932, "loss": 0.0179, "step": 63150 }, { "epoch": 0.68, "learning_rate": 0.00019758059285204641, "loss": 0.0167, "step": 63160 }, { "epoch": 0.68, "learning_rate": 0.00019756437698644353, "loss": 0.0168, "step": 63170 }, { "epoch": 0.68, "learning_rate": 0.0001975481611208406, "loss": 0.0176, "step": 63180 }, { "epoch": 0.68, "learning_rate": 0.0001975319452552377, "loss": 0.0147, "step": 63190 }, { "epoch": 0.68, "learning_rate": 0.0001975157293896348, "loss": 0.0134, "step": 63200 }, { "epoch": 0.68, "learning_rate": 0.0001974995135240319, "loss": 0.0174, "step": 63210 }, { "epoch": 0.68, "learning_rate": 0.00019748329765842897, "loss": 0.0173, "step": 63220 }, { "epoch": 0.68, "learning_rate": 0.00019746708179282606, "loss": 0.0147, "step": 63230 }, { "epoch": 0.68, "learning_rate": 0.00019745086592722318, "loss": 0.0211, "step": 63240 }, { "epoch": 0.68, "learning_rate": 0.00019743465006162028, "loss": 0.0174, "step": 63250 }, { "epoch": 0.68, "learning_rate": 0.00019741843419601734, "loss": 0.0121, "step": 63260 }, { "epoch": 0.68, "learning_rate": 0.00019740221833041446, "loss": 0.0149, "step": 63270 }, { "epoch": 0.68, "learning_rate": 0.00019738600246481155, "loss": 0.0151, "step": 63280 }, { "epoch": 0.68, "learning_rate": 0.00019736978659920865, "loss": 0.0172, "step": 63290 }, { "epoch": 0.68, "learning_rate": 0.00019735357073360577, "loss": 0.0157, "step": 63300 }, { "epoch": 0.68, "learning_rate": 0.00019733735486800283, "loss": 0.0171, "step": 63310 }, { "epoch": 0.68, "learning_rate": 0.00019732113900239993, "loss": 0.0141, "step": 63320 }, { "epoch": 0.68, "learning_rate": 0.00019730492313679705, "loss": 0.0159, "step": 63330 }, { "epoch": 0.68, "learning_rate": 0.00019728870727119414, "loss": 0.0149, "step": 63340 }, { "epoch": 0.68, "learning_rate": 0.0001972724914055912, "loss": 0.0188, "step": 63350 }, { "epoch": 0.68, "learning_rate": 0.0001972562755399883, "loss": 0.0153, "step": 63360 }, { "epoch": 0.69, "learning_rate": 0.00019724005967438542, "loss": 0.0147, "step": 63370 }, { "epoch": 0.69, "learning_rate": 0.0001972238438087825, "loss": 0.0154, "step": 63380 }, { "epoch": 0.69, "learning_rate": 0.00019720762794317958, "loss": 0.0161, "step": 63390 }, { "epoch": 0.69, "learning_rate": 0.0001971914120775767, "loss": 0.0143, "step": 63400 }, { "epoch": 0.69, "learning_rate": 0.0001971751962119738, "loss": 0.0161, "step": 63410 }, { "epoch": 0.69, "learning_rate": 0.00019715898034637088, "loss": 0.0146, "step": 63420 }, { "epoch": 0.69, "learning_rate": 0.00019714276448076795, "loss": 0.0158, "step": 63430 }, { "epoch": 0.69, "learning_rate": 0.00019712654861516507, "loss": 0.013, "step": 63440 }, { "epoch": 0.69, "learning_rate": 0.00019711033274956216, "loss": 0.0156, "step": 63450 }, { "epoch": 0.69, "learning_rate": 0.00019709411688395925, "loss": 0.0162, "step": 63460 }, { "epoch": 0.69, "learning_rate": 0.00019707790101835634, "loss": 0.0153, "step": 63470 }, { "epoch": 0.69, "learning_rate": 0.00019706168515275344, "loss": 0.0128, "step": 63480 }, { "epoch": 0.69, "learning_rate": 0.00019704546928715053, "loss": 0.0172, "step": 63490 }, { "epoch": 0.69, "learning_rate": 0.00019702925342154765, "loss": 0.0128, "step": 63500 }, { "epoch": 0.69, "learning_rate": 0.00019701303755594472, "loss": 0.0152, "step": 63510 }, { "epoch": 0.69, "learning_rate": 0.0001969968216903418, "loss": 0.0149, "step": 63520 }, { "epoch": 0.69, "learning_rate": 0.0001969806058247389, "loss": 0.0136, "step": 63530 }, { "epoch": 0.69, "learning_rate": 0.00019696438995913602, "loss": 0.0134, "step": 63540 }, { "epoch": 0.69, "learning_rate": 0.00019694817409353309, "loss": 0.0148, "step": 63550 }, { "epoch": 0.69, "learning_rate": 0.00019693195822793018, "loss": 0.0165, "step": 63560 }, { "epoch": 0.69, "learning_rate": 0.0001969157423623273, "loss": 0.0159, "step": 63570 }, { "epoch": 0.69, "learning_rate": 0.0001968995264967244, "loss": 0.0146, "step": 63580 }, { "epoch": 0.69, "learning_rate": 0.00019688331063112146, "loss": 0.0152, "step": 63590 }, { "epoch": 0.69, "learning_rate": 0.00019686709476551855, "loss": 0.0189, "step": 63600 }, { "epoch": 0.69, "learning_rate": 0.00019685087889991567, "loss": 0.0131, "step": 63610 }, { "epoch": 0.69, "learning_rate": 0.00019683466303431276, "loss": 0.0158, "step": 63620 }, { "epoch": 0.69, "learning_rate": 0.00019681844716870983, "loss": 0.0138, "step": 63630 }, { "epoch": 0.69, "learning_rate": 0.00019680223130310695, "loss": 0.0192, "step": 63640 }, { "epoch": 0.69, "learning_rate": 0.00019678601543750404, "loss": 0.0166, "step": 63650 }, { "epoch": 0.69, "learning_rate": 0.00019676979957190113, "loss": 0.0158, "step": 63660 }, { "epoch": 0.69, "learning_rate": 0.0001967535837062982, "loss": 0.0153, "step": 63670 }, { "epoch": 0.69, "learning_rate": 0.00019673736784069532, "loss": 0.0194, "step": 63680 }, { "epoch": 0.69, "learning_rate": 0.0001967211519750924, "loss": 0.0137, "step": 63690 }, { "epoch": 0.69, "learning_rate": 0.00019670493610948953, "loss": 0.0158, "step": 63700 }, { "epoch": 0.69, "learning_rate": 0.0001966887202438866, "loss": 0.0186, "step": 63710 }, { "epoch": 0.69, "learning_rate": 0.0001966725043782837, "loss": 0.0156, "step": 63720 }, { "epoch": 0.69, "learning_rate": 0.00019665628851268078, "loss": 0.0165, "step": 63730 }, { "epoch": 0.69, "learning_rate": 0.0001966400726470779, "loss": 0.0163, "step": 63740 }, { "epoch": 0.69, "learning_rate": 0.00019662385678147497, "loss": 0.0128, "step": 63750 }, { "epoch": 0.69, "learning_rate": 0.00019660764091587206, "loss": 0.0166, "step": 63760 }, { "epoch": 0.69, "learning_rate": 0.00019659142505026918, "loss": 0.0202, "step": 63770 }, { "epoch": 0.69, "learning_rate": 0.00019657520918466627, "loss": 0.0173, "step": 63780 }, { "epoch": 0.69, "learning_rate": 0.00019655899331906334, "loss": 0.0179, "step": 63790 }, { "epoch": 0.69, "learning_rate": 0.00019654277745346043, "loss": 0.0165, "step": 63800 }, { "epoch": 0.69, "learning_rate": 0.00019652656158785755, "loss": 0.0169, "step": 63810 }, { "epoch": 0.69, "learning_rate": 0.00019651034572225464, "loss": 0.0163, "step": 63820 }, { "epoch": 0.69, "learning_rate": 0.0001964941298566517, "loss": 0.0161, "step": 63830 }, { "epoch": 0.69, "learning_rate": 0.00019647791399104883, "loss": 0.0172, "step": 63840 }, { "epoch": 0.69, "learning_rate": 0.00019646169812544592, "loss": 0.0197, "step": 63850 }, { "epoch": 0.69, "learning_rate": 0.00019644548225984302, "loss": 0.0162, "step": 63860 }, { "epoch": 0.69, "learning_rate": 0.00019642926639424008, "loss": 0.0172, "step": 63870 }, { "epoch": 0.69, "learning_rate": 0.0001964130505286372, "loss": 0.0145, "step": 63880 }, { "epoch": 0.69, "learning_rate": 0.0001963968346630343, "loss": 0.0156, "step": 63890 }, { "epoch": 0.69, "learning_rate": 0.00019638061879743139, "loss": 0.0165, "step": 63900 }, { "epoch": 0.69, "learning_rate": 0.00019636440293182848, "loss": 0.019, "step": 63910 }, { "epoch": 0.69, "learning_rate": 0.00019634818706622557, "loss": 0.0141, "step": 63920 }, { "epoch": 0.69, "learning_rate": 0.00019633197120062266, "loss": 0.0151, "step": 63930 }, { "epoch": 0.69, "learning_rate": 0.00019631575533501978, "loss": 0.0172, "step": 63940 }, { "epoch": 0.69, "learning_rate": 0.00019629953946941685, "loss": 0.0167, "step": 63950 }, { "epoch": 0.69, "learning_rate": 0.00019628332360381394, "loss": 0.0155, "step": 63960 }, { "epoch": 0.69, "learning_rate": 0.00019626710773821104, "loss": 0.013, "step": 63970 }, { "epoch": 0.69, "learning_rate": 0.00019625089187260816, "loss": 0.015, "step": 63980 }, { "epoch": 0.69, "learning_rate": 0.00019623467600700522, "loss": 0.012, "step": 63990 }, { "epoch": 0.69, "learning_rate": 0.00019621846014140231, "loss": 0.0163, "step": 64000 }, { "epoch": 0.69, "eval_cer": 0.9215434379652454, "eval_loss": 0.01114691887050867, "eval_runtime": 121.2239, "eval_samples_per_second": 16.498, "eval_steps_per_second": 4.125, "step": 64000 }, { "epoch": 0.69, "learning_rate": 0.00019620224427579943, "loss": 0.016, "step": 64010 }, { "epoch": 0.69, "learning_rate": 0.00019618602841019653, "loss": 0.014, "step": 64020 }, { "epoch": 0.69, "learning_rate": 0.00019616981254459362, "loss": 0.0171, "step": 64030 }, { "epoch": 0.69, "learning_rate": 0.0001961535966789907, "loss": 0.0209, "step": 64040 }, { "epoch": 0.69, "learning_rate": 0.0001961373808133878, "loss": 0.0122, "step": 64050 }, { "epoch": 0.69, "learning_rate": 0.0001961211649477849, "loss": 0.016, "step": 64060 }, { "epoch": 0.69, "learning_rate": 0.00019610494908218202, "loss": 0.0133, "step": 64070 }, { "epoch": 0.69, "learning_rate": 0.00019608873321657908, "loss": 0.0137, "step": 64080 }, { "epoch": 0.69, "learning_rate": 0.00019607251735097618, "loss": 0.0141, "step": 64090 }, { "epoch": 0.69, "learning_rate": 0.00019605630148537327, "loss": 0.0166, "step": 64100 }, { "epoch": 0.69, "learning_rate": 0.0001960400856197704, "loss": 0.017, "step": 64110 }, { "epoch": 0.69, "learning_rate": 0.00019602386975416745, "loss": 0.0189, "step": 64120 }, { "epoch": 0.69, "learning_rate": 0.00019600765388856455, "loss": 0.0164, "step": 64130 }, { "epoch": 0.69, "learning_rate": 0.00019599143802296167, "loss": 0.0173, "step": 64140 }, { "epoch": 0.69, "learning_rate": 0.00019597522215735876, "loss": 0.0165, "step": 64150 }, { "epoch": 0.69, "learning_rate": 0.00019595900629175582, "loss": 0.0138, "step": 64160 }, { "epoch": 0.69, "learning_rate": 0.00019594279042615292, "loss": 0.0115, "step": 64170 }, { "epoch": 0.69, "learning_rate": 0.00019592657456055004, "loss": 0.0179, "step": 64180 }, { "epoch": 0.69, "learning_rate": 0.00019591035869494713, "loss": 0.0152, "step": 64190 }, { "epoch": 0.69, "learning_rate": 0.0001958941428293442, "loss": 0.0152, "step": 64200 }, { "epoch": 0.69, "learning_rate": 0.00019587792696374132, "loss": 0.0166, "step": 64210 }, { "epoch": 0.69, "learning_rate": 0.0001958617110981384, "loss": 0.017, "step": 64220 }, { "epoch": 0.69, "learning_rate": 0.0001958454952325355, "loss": 0.0146, "step": 64230 }, { "epoch": 0.69, "learning_rate": 0.00019582927936693257, "loss": 0.0149, "step": 64240 }, { "epoch": 0.69, "learning_rate": 0.0001958130635013297, "loss": 0.0195, "step": 64250 }, { "epoch": 0.69, "learning_rate": 0.00019579684763572678, "loss": 0.0163, "step": 64260 }, { "epoch": 0.69, "learning_rate": 0.0001957806317701239, "loss": 0.0138, "step": 64270 }, { "epoch": 0.69, "learning_rate": 0.00019576441590452096, "loss": 0.0161, "step": 64280 }, { "epoch": 0.7, "learning_rate": 0.00019574820003891806, "loss": 0.016, "step": 64290 }, { "epoch": 0.7, "learning_rate": 0.00019573198417331515, "loss": 0.0167, "step": 64300 }, { "epoch": 0.7, "learning_rate": 0.00019571576830771227, "loss": 0.018, "step": 64310 }, { "epoch": 0.7, "learning_rate": 0.00019569955244210934, "loss": 0.0151, "step": 64320 }, { "epoch": 0.7, "learning_rate": 0.00019568333657650643, "loss": 0.0164, "step": 64330 }, { "epoch": 0.7, "learning_rate": 0.00019566712071090355, "loss": 0.0162, "step": 64340 }, { "epoch": 0.7, "learning_rate": 0.00019565090484530064, "loss": 0.014, "step": 64350 }, { "epoch": 0.7, "learning_rate": 0.0001956346889796977, "loss": 0.0171, "step": 64360 }, { "epoch": 0.7, "learning_rate": 0.0001956184731140948, "loss": 0.0144, "step": 64370 }, { "epoch": 0.7, "learning_rate": 0.00019560225724849192, "loss": 0.0153, "step": 64380 }, { "epoch": 0.7, "learning_rate": 0.000195586041382889, "loss": 0.0152, "step": 64390 }, { "epoch": 0.7, "learning_rate": 0.00019556982551728608, "loss": 0.0177, "step": 64400 }, { "epoch": 0.7, "learning_rate": 0.0001955536096516832, "loss": 0.0153, "step": 64410 }, { "epoch": 0.7, "learning_rate": 0.0001955373937860803, "loss": 0.0163, "step": 64420 }, { "epoch": 0.7, "learning_rate": 0.00019552117792047738, "loss": 0.0178, "step": 64430 }, { "epoch": 0.7, "learning_rate": 0.00019550496205487445, "loss": 0.0134, "step": 64440 }, { "epoch": 0.7, "learning_rate": 0.00019548874618927157, "loss": 0.0142, "step": 64450 }, { "epoch": 0.7, "learning_rate": 0.00019547253032366866, "loss": 0.0142, "step": 64460 }, { "epoch": 0.7, "learning_rate": 0.00019545631445806575, "loss": 0.0178, "step": 64470 }, { "epoch": 0.7, "learning_rate": 0.00019544009859246285, "loss": 0.014, "step": 64480 }, { "epoch": 0.7, "learning_rate": 0.00019542388272685994, "loss": 0.0156, "step": 64490 }, { "epoch": 0.7, "learning_rate": 0.00019540766686125703, "loss": 0.0158, "step": 64500 }, { "epoch": 0.7, "learning_rate": 0.00019539145099565415, "loss": 0.0144, "step": 64510 }, { "epoch": 0.7, "learning_rate": 0.00019537523513005122, "loss": 0.0182, "step": 64520 }, { "epoch": 0.7, "learning_rate": 0.0001953590192644483, "loss": 0.0151, "step": 64530 }, { "epoch": 0.7, "learning_rate": 0.0001953428033988454, "loss": 0.0177, "step": 64540 }, { "epoch": 0.7, "learning_rate": 0.00019532658753324252, "loss": 0.0162, "step": 64550 }, { "epoch": 0.7, "learning_rate": 0.0001953103716676396, "loss": 0.0154, "step": 64560 }, { "epoch": 0.7, "learning_rate": 0.00019529415580203668, "loss": 0.0195, "step": 64570 }, { "epoch": 0.7, "learning_rate": 0.0001952779399364338, "loss": 0.0183, "step": 64580 }, { "epoch": 0.7, "learning_rate": 0.0001952617240708309, "loss": 0.0129, "step": 64590 }, { "epoch": 0.7, "learning_rate": 0.00019524550820522796, "loss": 0.0135, "step": 64600 }, { "epoch": 0.7, "learning_rate": 0.00019522929233962505, "loss": 0.0145, "step": 64610 }, { "epoch": 0.7, "learning_rate": 0.00019521307647402217, "loss": 0.0136, "step": 64620 }, { "epoch": 0.7, "learning_rate": 0.00019519686060841927, "loss": 0.0145, "step": 64630 }, { "epoch": 0.7, "learning_rate": 0.00019518064474281633, "loss": 0.0173, "step": 64640 }, { "epoch": 0.7, "learning_rate": 0.00019516442887721345, "loss": 0.0142, "step": 64650 }, { "epoch": 0.7, "learning_rate": 0.00019514821301161054, "loss": 0.015, "step": 64660 }, { "epoch": 0.7, "learning_rate": 0.00019513199714600764, "loss": 0.0193, "step": 64670 }, { "epoch": 0.7, "learning_rate": 0.0001951157812804047, "loss": 0.0141, "step": 64680 }, { "epoch": 0.7, "learning_rate": 0.00019509956541480182, "loss": 0.0138, "step": 64690 }, { "epoch": 0.7, "learning_rate": 0.00019508334954919891, "loss": 0.0201, "step": 64700 }, { "epoch": 0.7, "learning_rate": 0.00019506713368359603, "loss": 0.0149, "step": 64710 }, { "epoch": 0.7, "learning_rate": 0.0001950509178179931, "loss": 0.0166, "step": 64720 }, { "epoch": 0.7, "learning_rate": 0.0001950347019523902, "loss": 0.0165, "step": 64730 }, { "epoch": 0.7, "learning_rate": 0.00019501848608678729, "loss": 0.0143, "step": 64740 }, { "epoch": 0.7, "learning_rate": 0.0001950022702211844, "loss": 0.0193, "step": 64750 }, { "epoch": 0.7, "learning_rate": 0.0001949860543555815, "loss": 0.0122, "step": 64760 }, { "epoch": 0.7, "learning_rate": 0.00019496983848997856, "loss": 0.015, "step": 64770 }, { "epoch": 0.7, "learning_rate": 0.00019495362262437568, "loss": 0.0144, "step": 64780 }, { "epoch": 0.7, "learning_rate": 0.00019493740675877278, "loss": 0.019, "step": 64790 }, { "epoch": 0.7, "learning_rate": 0.00019492119089316987, "loss": 0.0156, "step": 64800 }, { "epoch": 0.7, "learning_rate": 0.00019490497502756693, "loss": 0.0157, "step": 64810 }, { "epoch": 0.7, "learning_rate": 0.00019488875916196405, "loss": 0.0152, "step": 64820 }, { "epoch": 0.7, "learning_rate": 0.00019487254329636115, "loss": 0.0171, "step": 64830 }, { "epoch": 0.7, "learning_rate": 0.00019485632743075824, "loss": 0.0206, "step": 64840 }, { "epoch": 0.7, "learning_rate": 0.00019484011156515533, "loss": 0.0173, "step": 64850 }, { "epoch": 0.7, "learning_rate": 0.00019482389569955243, "loss": 0.0182, "step": 64860 }, { "epoch": 0.7, "learning_rate": 0.00019480767983394952, "loss": 0.0126, "step": 64870 }, { "epoch": 0.7, "learning_rate": 0.00019479146396834664, "loss": 0.0155, "step": 64880 }, { "epoch": 0.7, "learning_rate": 0.0001947752481027437, "loss": 0.0238, "step": 64890 }, { "epoch": 0.7, "learning_rate": 0.0001947590322371408, "loss": 0.0146, "step": 64900 }, { "epoch": 0.7, "learning_rate": 0.0001947428163715379, "loss": 0.0146, "step": 64910 }, { "epoch": 0.7, "learning_rate": 0.000194726600505935, "loss": 0.0145, "step": 64920 }, { "epoch": 0.7, "learning_rate": 0.00019471038464033207, "loss": 0.012, "step": 64930 }, { "epoch": 0.7, "learning_rate": 0.00019469416877472917, "loss": 0.015, "step": 64940 }, { "epoch": 0.7, "learning_rate": 0.0001946779529091263, "loss": 0.0167, "step": 64950 }, { "epoch": 0.7, "learning_rate": 0.00019466173704352338, "loss": 0.0123, "step": 64960 }, { "epoch": 0.7, "learning_rate": 0.00019464552117792045, "loss": 0.0177, "step": 64970 }, { "epoch": 0.7, "learning_rate": 0.00019462930531231754, "loss": 0.0124, "step": 64980 }, { "epoch": 0.7, "learning_rate": 0.00019461308944671466, "loss": 0.0137, "step": 64990 }, { "epoch": 0.7, "learning_rate": 0.00019459687358111175, "loss": 0.0128, "step": 65000 }, { "epoch": 0.7, "eval_cer": 0.921535620538638, "eval_loss": 0.011012510396540165, "eval_runtime": 121.262, "eval_samples_per_second": 16.493, "eval_steps_per_second": 4.123, "step": 65000 }, { "epoch": 0.7, "learning_rate": 0.00019458065771550882, "loss": 0.0179, "step": 65010 }, { "epoch": 0.7, "learning_rate": 0.00019456444184990594, "loss": 0.0162, "step": 65020 }, { "epoch": 0.7, "learning_rate": 0.00019454822598430303, "loss": 0.0159, "step": 65030 }, { "epoch": 0.7, "learning_rate": 0.00019453201011870012, "loss": 0.0121, "step": 65040 }, { "epoch": 0.7, "learning_rate": 0.00019451579425309721, "loss": 0.0147, "step": 65050 }, { "epoch": 0.7, "learning_rate": 0.0001944995783874943, "loss": 0.0127, "step": 65060 }, { "epoch": 0.7, "learning_rate": 0.0001944833625218914, "loss": 0.0135, "step": 65070 }, { "epoch": 0.7, "learning_rate": 0.00019446714665628852, "loss": 0.0161, "step": 65080 }, { "epoch": 0.7, "learning_rate": 0.00019445093079068559, "loss": 0.0129, "step": 65090 }, { "epoch": 0.7, "learning_rate": 0.00019443471492508268, "loss": 0.0205, "step": 65100 }, { "epoch": 0.7, "learning_rate": 0.00019441849905947977, "loss": 0.0176, "step": 65110 }, { "epoch": 0.7, "learning_rate": 0.0001944022831938769, "loss": 0.0163, "step": 65120 }, { "epoch": 0.7, "learning_rate": 0.00019438606732827396, "loss": 0.0138, "step": 65130 }, { "epoch": 0.7, "learning_rate": 0.00019436985146267105, "loss": 0.0166, "step": 65140 }, { "epoch": 0.7, "learning_rate": 0.00019435363559706817, "loss": 0.0161, "step": 65150 }, { "epoch": 0.7, "learning_rate": 0.00019433741973146526, "loss": 0.0168, "step": 65160 }, { "epoch": 0.7, "learning_rate": 0.00019432120386586233, "loss": 0.0157, "step": 65170 }, { "epoch": 0.7, "learning_rate": 0.00019430498800025942, "loss": 0.0163, "step": 65180 }, { "epoch": 0.7, "learning_rate": 0.00019428877213465654, "loss": 0.0141, "step": 65190 }, { "epoch": 0.7, "learning_rate": 0.00019427255626905363, "loss": 0.0154, "step": 65200 }, { "epoch": 0.7, "learning_rate": 0.0001942563404034507, "loss": 0.0154, "step": 65210 }, { "epoch": 0.71, "learning_rate": 0.00019424012453784782, "loss": 0.0157, "step": 65220 }, { "epoch": 0.71, "learning_rate": 0.0001942239086722449, "loss": 0.0145, "step": 65230 }, { "epoch": 0.71, "learning_rate": 0.000194207692806642, "loss": 0.0179, "step": 65240 }, { "epoch": 0.71, "learning_rate": 0.00019419147694103907, "loss": 0.0134, "step": 65250 }, { "epoch": 0.71, "learning_rate": 0.0001941752610754362, "loss": 0.0146, "step": 65260 }, { "epoch": 0.71, "learning_rate": 0.00019415904520983328, "loss": 0.0201, "step": 65270 }, { "epoch": 0.71, "learning_rate": 0.0001941428293442304, "loss": 0.0198, "step": 65280 }, { "epoch": 0.71, "learning_rate": 0.00019412661347862747, "loss": 0.0149, "step": 65290 }, { "epoch": 0.71, "learning_rate": 0.00019411039761302456, "loss": 0.017, "step": 65300 }, { "epoch": 0.71, "learning_rate": 0.00019409418174742165, "loss": 0.0123, "step": 65310 }, { "epoch": 0.71, "learning_rate": 0.00019407796588181877, "loss": 0.0146, "step": 65320 }, { "epoch": 0.71, "learning_rate": 0.00019406175001621584, "loss": 0.0146, "step": 65330 }, { "epoch": 0.71, "learning_rate": 0.00019404553415061293, "loss": 0.0149, "step": 65340 }, { "epoch": 0.71, "learning_rate": 0.00019402931828501005, "loss": 0.013, "step": 65350 }, { "epoch": 0.71, "learning_rate": 0.00019401310241940714, "loss": 0.0123, "step": 65360 }, { "epoch": 0.71, "learning_rate": 0.0001939968865538042, "loss": 0.0132, "step": 65370 }, { "epoch": 0.71, "learning_rate": 0.0001939806706882013, "loss": 0.0167, "step": 65380 }, { "epoch": 0.71, "learning_rate": 0.00019396445482259842, "loss": 0.0127, "step": 65390 }, { "epoch": 0.71, "learning_rate": 0.00019394823895699551, "loss": 0.013, "step": 65400 }, { "epoch": 0.71, "learning_rate": 0.00019393202309139258, "loss": 0.0135, "step": 65410 }, { "epoch": 0.71, "learning_rate": 0.0001939158072257897, "loss": 0.0183, "step": 65420 }, { "epoch": 0.71, "learning_rate": 0.0001938995913601868, "loss": 0.0162, "step": 65430 }, { "epoch": 0.71, "learning_rate": 0.00019388337549458389, "loss": 0.0151, "step": 65440 }, { "epoch": 0.71, "learning_rate": 0.00019386715962898095, "loss": 0.014, "step": 65450 }, { "epoch": 0.71, "learning_rate": 0.00019385094376337807, "loss": 0.0146, "step": 65460 }, { "epoch": 0.71, "learning_rate": 0.00019383472789777516, "loss": 0.017, "step": 65470 }, { "epoch": 0.71, "learning_rate": 0.00019381851203217226, "loss": 0.0163, "step": 65480 }, { "epoch": 0.71, "learning_rate": 0.00019380229616656938, "loss": 0.0132, "step": 65490 }, { "epoch": 0.71, "learning_rate": 0.00019378608030096644, "loss": 0.0162, "step": 65500 }, { "epoch": 0.71, "learning_rate": 0.00019376986443536353, "loss": 0.0131, "step": 65510 }, { "epoch": 0.71, "learning_rate": 0.00019375364856976065, "loss": 0.0149, "step": 65520 }, { "epoch": 0.71, "learning_rate": 0.00019373743270415775, "loss": 0.0134, "step": 65530 }, { "epoch": 0.71, "learning_rate": 0.0001937212168385548, "loss": 0.0144, "step": 65540 }, { "epoch": 0.71, "learning_rate": 0.0001937050009729519, "loss": 0.0143, "step": 65550 }, { "epoch": 0.71, "learning_rate": 0.00019368878510734903, "loss": 0.0134, "step": 65560 }, { "epoch": 0.71, "learning_rate": 0.00019367256924174612, "loss": 0.0173, "step": 65570 }, { "epoch": 0.71, "learning_rate": 0.00019365635337614318, "loss": 0.017, "step": 65580 }, { "epoch": 0.71, "learning_rate": 0.0001936401375105403, "loss": 0.0164, "step": 65590 }, { "epoch": 0.71, "learning_rate": 0.0001936239216449374, "loss": 0.0155, "step": 65600 }, { "epoch": 0.71, "learning_rate": 0.0001936077057793345, "loss": 0.0163, "step": 65610 }, { "epoch": 0.71, "learning_rate": 0.00019359148991373156, "loss": 0.0151, "step": 65620 }, { "epoch": 0.71, "learning_rate": 0.00019357527404812867, "loss": 0.0156, "step": 65630 }, { "epoch": 0.71, "learning_rate": 0.00019355905818252577, "loss": 0.0155, "step": 65640 }, { "epoch": 0.71, "learning_rate": 0.0001935428423169229, "loss": 0.0166, "step": 65650 }, { "epoch": 0.71, "learning_rate": 0.00019352662645131995, "loss": 0.0189, "step": 65660 }, { "epoch": 0.71, "learning_rate": 0.00019351041058571705, "loss": 0.0135, "step": 65670 }, { "epoch": 0.71, "learning_rate": 0.00019349419472011414, "loss": 0.015, "step": 65680 }, { "epoch": 0.71, "learning_rate": 0.00019347797885451126, "loss": 0.0137, "step": 65690 }, { "epoch": 0.71, "learning_rate": 0.00019346176298890832, "loss": 0.016, "step": 65700 }, { "epoch": 0.71, "learning_rate": 0.00019344554712330542, "loss": 0.0133, "step": 65710 }, { "epoch": 0.71, "learning_rate": 0.00019342933125770254, "loss": 0.0129, "step": 65720 }, { "epoch": 0.71, "learning_rate": 0.00019341311539209963, "loss": 0.0157, "step": 65730 }, { "epoch": 0.71, "learning_rate": 0.0001933968995264967, "loss": 0.0161, "step": 65740 }, { "epoch": 0.71, "learning_rate": 0.0001933806836608938, "loss": 0.0157, "step": 65750 }, { "epoch": 0.71, "learning_rate": 0.0001933644677952909, "loss": 0.0136, "step": 65760 }, { "epoch": 0.71, "learning_rate": 0.000193348251929688, "loss": 0.0144, "step": 65770 }, { "epoch": 0.71, "learning_rate": 0.00019333203606408507, "loss": 0.0165, "step": 65780 }, { "epoch": 0.71, "learning_rate": 0.00019331582019848219, "loss": 0.0161, "step": 65790 }, { "epoch": 0.71, "learning_rate": 0.00019329960433287928, "loss": 0.0148, "step": 65800 }, { "epoch": 0.71, "learning_rate": 0.00019328338846727637, "loss": 0.0178, "step": 65810 }, { "epoch": 0.71, "learning_rate": 0.00019326717260167344, "loss": 0.0169, "step": 65820 }, { "epoch": 0.71, "learning_rate": 0.00019325095673607056, "loss": 0.0139, "step": 65830 }, { "epoch": 0.71, "learning_rate": 0.00019323474087046765, "loss": 0.0121, "step": 65840 }, { "epoch": 0.71, "learning_rate": 0.00019321852500486474, "loss": 0.015, "step": 65850 }, { "epoch": 0.71, "learning_rate": 0.00019320230913926184, "loss": 0.0155, "step": 65860 }, { "epoch": 0.71, "learning_rate": 0.00019318609327365893, "loss": 0.0141, "step": 65870 }, { "epoch": 0.71, "learning_rate": 0.00019316987740805602, "loss": 0.0175, "step": 65880 }, { "epoch": 0.71, "learning_rate": 0.00019315366154245314, "loss": 0.0132, "step": 65890 }, { "epoch": 0.71, "learning_rate": 0.0001931374456768502, "loss": 0.0175, "step": 65900 }, { "epoch": 0.71, "learning_rate": 0.0001931212298112473, "loss": 0.0144, "step": 65910 }, { "epoch": 0.71, "learning_rate": 0.0001931050139456444, "loss": 0.0172, "step": 65920 }, { "epoch": 0.71, "learning_rate": 0.0001930887980800415, "loss": 0.0136, "step": 65930 }, { "epoch": 0.71, "learning_rate": 0.00019307258221443858, "loss": 0.0171, "step": 65940 }, { "epoch": 0.71, "learning_rate": 0.00019305636634883567, "loss": 0.0192, "step": 65950 }, { "epoch": 0.71, "learning_rate": 0.0001930401504832328, "loss": 0.0198, "step": 65960 }, { "epoch": 0.71, "learning_rate": 0.00019302393461762988, "loss": 0.017, "step": 65970 }, { "epoch": 0.71, "learning_rate": 0.00019300771875202695, "loss": 0.0164, "step": 65980 }, { "epoch": 0.71, "learning_rate": 0.00019299150288642404, "loss": 0.0195, "step": 65990 }, { "epoch": 0.71, "learning_rate": 0.00019297528702082116, "loss": 0.0178, "step": 66000 }, { "epoch": 0.71, "eval_cer": 0.9215451751711582, "eval_loss": 0.011317442171275616, "eval_runtime": 121.212, "eval_samples_per_second": 16.5, "eval_steps_per_second": 4.125, "step": 66000 }, { "epoch": 0.71, "learning_rate": 0.00019295907115521825, "loss": 0.0174, "step": 66010 }, { "epoch": 0.71, "learning_rate": 0.00019294285528961532, "loss": 0.0161, "step": 66020 }, { "epoch": 0.71, "learning_rate": 0.00019292663942401244, "loss": 0.0122, "step": 66030 }, { "epoch": 0.71, "learning_rate": 0.00019291042355840953, "loss": 0.0125, "step": 66040 }, { "epoch": 0.71, "learning_rate": 0.00019289420769280662, "loss": 0.0157, "step": 66050 }, { "epoch": 0.71, "learning_rate": 0.00019287799182720372, "loss": 0.0176, "step": 66060 }, { "epoch": 0.71, "learning_rate": 0.0001928617759616008, "loss": 0.015, "step": 66070 }, { "epoch": 0.71, "learning_rate": 0.0001928455600959979, "loss": 0.0156, "step": 66080 }, { "epoch": 0.71, "learning_rate": 0.00019282934423039502, "loss": 0.0173, "step": 66090 }, { "epoch": 0.71, "learning_rate": 0.0001928131283647921, "loss": 0.0168, "step": 66100 }, { "epoch": 0.71, "learning_rate": 0.00019279691249918918, "loss": 0.0169, "step": 66110 }, { "epoch": 0.71, "learning_rate": 0.00019278069663358627, "loss": 0.0141, "step": 66120 }, { "epoch": 0.71, "learning_rate": 0.0001927644807679834, "loss": 0.0161, "step": 66130 }, { "epoch": 0.72, "learning_rate": 0.00019274826490238046, "loss": 0.014, "step": 66140 }, { "epoch": 0.72, "learning_rate": 0.00019273204903677755, "loss": 0.0141, "step": 66150 }, { "epoch": 0.72, "learning_rate": 0.00019271583317117467, "loss": 0.0157, "step": 66160 }, { "epoch": 0.72, "learning_rate": 0.00019269961730557176, "loss": 0.0146, "step": 66170 }, { "epoch": 0.72, "learning_rate": 0.00019268340143996886, "loss": 0.0123, "step": 66180 }, { "epoch": 0.72, "learning_rate": 0.00019266718557436592, "loss": 0.0139, "step": 66190 }, { "epoch": 0.72, "learning_rate": 0.00019265096970876304, "loss": 0.0164, "step": 66200 }, { "epoch": 0.72, "learning_rate": 0.00019263475384316014, "loss": 0.0164, "step": 66210 }, { "epoch": 0.72, "learning_rate": 0.00019261853797755723, "loss": 0.0176, "step": 66220 }, { "epoch": 0.72, "learning_rate": 0.00019260232211195432, "loss": 0.0146, "step": 66230 }, { "epoch": 0.72, "learning_rate": 0.00019258610624635141, "loss": 0.0193, "step": 66240 }, { "epoch": 0.72, "learning_rate": 0.0001925698903807485, "loss": 0.015, "step": 66250 }, { "epoch": 0.72, "learning_rate": 0.00019255367451514563, "loss": 0.0219, "step": 66260 }, { "epoch": 0.72, "learning_rate": 0.0001925374586495427, "loss": 0.0172, "step": 66270 }, { "epoch": 0.72, "learning_rate": 0.00019252124278393978, "loss": 0.0137, "step": 66280 }, { "epoch": 0.72, "learning_rate": 0.0001925050269183369, "loss": 0.0139, "step": 66290 }, { "epoch": 0.72, "learning_rate": 0.000192488811052734, "loss": 0.0155, "step": 66300 }, { "epoch": 0.72, "learning_rate": 0.00019247259518713106, "loss": 0.015, "step": 66310 }, { "epoch": 0.72, "learning_rate": 0.00019245637932152816, "loss": 0.0155, "step": 66320 }, { "epoch": 0.72, "learning_rate": 0.00019244016345592528, "loss": 0.0193, "step": 66330 }, { "epoch": 0.72, "learning_rate": 0.00019242394759032237, "loss": 0.0221, "step": 66340 }, { "epoch": 0.72, "learning_rate": 0.00019240773172471943, "loss": 0.0181, "step": 66350 }, { "epoch": 0.72, "learning_rate": 0.00019239151585911655, "loss": 0.0136, "step": 66360 }, { "epoch": 0.72, "learning_rate": 0.00019237529999351365, "loss": 0.0198, "step": 66370 }, { "epoch": 0.72, "learning_rate": 0.00019235908412791074, "loss": 0.0168, "step": 66380 }, { "epoch": 0.72, "learning_rate": 0.0001923428682623078, "loss": 0.0135, "step": 66390 }, { "epoch": 0.72, "learning_rate": 0.00019232665239670492, "loss": 0.0318, "step": 66400 }, { "epoch": 0.72, "learning_rate": 0.00019231043653110202, "loss": 0.0237, "step": 66410 }, { "epoch": 0.72, "learning_rate": 0.0001922942206654991, "loss": 0.0142, "step": 66420 }, { "epoch": 0.72, "learning_rate": 0.0001922780047998962, "loss": 0.0145, "step": 66430 }, { "epoch": 0.72, "learning_rate": 0.0001922617889342933, "loss": 0.0188, "step": 66440 }, { "epoch": 0.72, "learning_rate": 0.0001922455730686904, "loss": 0.0172, "step": 66450 }, { "epoch": 0.72, "learning_rate": 0.0001922293572030875, "loss": 0.0172, "step": 66460 }, { "epoch": 0.72, "learning_rate": 0.00019221314133748457, "loss": 0.0158, "step": 66470 }, { "epoch": 0.72, "learning_rate": 0.00019219692547188167, "loss": 0.0186, "step": 66480 }, { "epoch": 0.72, "learning_rate": 0.00019218070960627876, "loss": 0.0152, "step": 66490 }, { "epoch": 0.72, "learning_rate": 0.00019216449374067588, "loss": 0.0144, "step": 66500 }, { "epoch": 0.72, "learning_rate": 0.00019214827787507294, "loss": 0.0128, "step": 66510 }, { "epoch": 0.72, "learning_rate": 0.00019213206200947004, "loss": 0.0138, "step": 66520 }, { "epoch": 0.72, "learning_rate": 0.00019211584614386716, "loss": 0.0159, "step": 66530 }, { "epoch": 0.72, "learning_rate": 0.00019209963027826425, "loss": 0.0149, "step": 66540 }, { "epoch": 0.72, "learning_rate": 0.00019208341441266132, "loss": 0.023, "step": 66550 }, { "epoch": 0.72, "learning_rate": 0.0001920671985470584, "loss": 0.0183, "step": 66560 }, { "epoch": 0.72, "learning_rate": 0.00019205098268145553, "loss": 0.019, "step": 66570 }, { "epoch": 0.72, "learning_rate": 0.00019203476681585262, "loss": 0.0167, "step": 66580 }, { "epoch": 0.72, "learning_rate": 0.0001920185509502497, "loss": 0.0199, "step": 66590 }, { "epoch": 0.72, "learning_rate": 0.0001920023350846468, "loss": 0.0147, "step": 66600 }, { "epoch": 0.72, "learning_rate": 0.0001919861192190439, "loss": 0.0144, "step": 66610 }, { "epoch": 0.72, "learning_rate": 0.000191969903353441, "loss": 0.0148, "step": 66620 }, { "epoch": 0.72, "learning_rate": 0.00019195368748783806, "loss": 0.0171, "step": 66630 }, { "epoch": 0.72, "learning_rate": 0.00019193747162223518, "loss": 0.0171, "step": 66640 }, { "epoch": 0.72, "learning_rate": 0.00019192125575663227, "loss": 0.015, "step": 66650 }, { "epoch": 0.72, "learning_rate": 0.0001919050398910294, "loss": 0.0152, "step": 66660 }, { "epoch": 0.72, "learning_rate": 0.00019188882402542646, "loss": 0.0137, "step": 66670 }, { "epoch": 0.72, "learning_rate": 0.00019187260815982355, "loss": 0.0162, "step": 66680 }, { "epoch": 0.72, "learning_rate": 0.00019185639229422064, "loss": 0.0147, "step": 66690 }, { "epoch": 0.72, "learning_rate": 0.00019184017642861776, "loss": 0.0197, "step": 66700 }, { "epoch": 0.72, "learning_rate": 0.00019182396056301483, "loss": 0.0173, "step": 66710 }, { "epoch": 0.72, "learning_rate": 0.00019180774469741192, "loss": 0.0156, "step": 66720 }, { "epoch": 0.72, "learning_rate": 0.00019179152883180904, "loss": 0.0124, "step": 66730 }, { "epoch": 0.72, "learning_rate": 0.00019177531296620613, "loss": 0.0149, "step": 66740 }, { "epoch": 0.72, "learning_rate": 0.0001917590971006032, "loss": 0.0175, "step": 66750 }, { "epoch": 0.72, "learning_rate": 0.0001917428812350003, "loss": 0.0148, "step": 66760 }, { "epoch": 0.72, "learning_rate": 0.0001917266653693974, "loss": 0.019, "step": 66770 }, { "epoch": 0.72, "learning_rate": 0.0001917104495037945, "loss": 0.016, "step": 66780 }, { "epoch": 0.72, "learning_rate": 0.00019169423363819157, "loss": 0.0154, "step": 66790 }, { "epoch": 0.72, "learning_rate": 0.0001916780177725887, "loss": 0.0109, "step": 66800 }, { "epoch": 0.72, "learning_rate": 0.00019166180190698578, "loss": 0.0148, "step": 66810 }, { "epoch": 0.72, "learning_rate": 0.00019164558604138287, "loss": 0.013, "step": 66820 }, { "epoch": 0.72, "learning_rate": 0.00019162937017577994, "loss": 0.0209, "step": 66830 }, { "epoch": 0.72, "learning_rate": 0.00019161315431017706, "loss": 0.0141, "step": 66840 }, { "epoch": 0.72, "learning_rate": 0.00019159693844457415, "loss": 0.0156, "step": 66850 }, { "epoch": 0.72, "learning_rate": 0.00019158072257897125, "loss": 0.0153, "step": 66860 }, { "epoch": 0.72, "learning_rate": 0.00019156450671336834, "loss": 0.0153, "step": 66870 }, { "epoch": 0.72, "learning_rate": 0.00019154829084776543, "loss": 0.014, "step": 66880 }, { "epoch": 0.72, "learning_rate": 0.00019153207498216252, "loss": 0.0168, "step": 66890 }, { "epoch": 0.72, "learning_rate": 0.00019151585911655964, "loss": 0.0197, "step": 66900 }, { "epoch": 0.72, "learning_rate": 0.00019149964325095674, "loss": 0.0152, "step": 66910 }, { "epoch": 0.72, "learning_rate": 0.0001914834273853538, "loss": 0.0164, "step": 66920 }, { "epoch": 0.72, "learning_rate": 0.0001914672115197509, "loss": 0.012, "step": 66930 }, { "epoch": 0.72, "learning_rate": 0.00019145099565414801, "loss": 0.014, "step": 66940 }, { "epoch": 0.72, "learning_rate": 0.0001914347797885451, "loss": 0.0145, "step": 66950 }, { "epoch": 0.72, "learning_rate": 0.00019141856392294217, "loss": 0.0151, "step": 66960 }, { "epoch": 0.72, "learning_rate": 0.0001914023480573393, "loss": 0.0133, "step": 66970 }, { "epoch": 0.72, "learning_rate": 0.00019138613219173639, "loss": 0.0181, "step": 66980 }, { "epoch": 0.72, "learning_rate": 0.00019136991632613348, "loss": 0.0143, "step": 66990 }, { "epoch": 0.72, "learning_rate": 0.00019135370046053054, "loss": 0.0142, "step": 67000 }, { "epoch": 0.72, "eval_cer": 0.921521722891336, "eval_loss": 0.010987049899995327, "eval_runtime": 121.4092, "eval_samples_per_second": 16.473, "eval_steps_per_second": 4.118, "step": 67000 }, { "epoch": 0.72, "learning_rate": 0.00019133748459492766, "loss": 0.0133, "step": 67010 }, { "epoch": 0.72, "learning_rate": 0.00019132126872932476, "loss": 0.0152, "step": 67020 }, { "epoch": 0.72, "learning_rate": 0.00019130505286372188, "loss": 0.0148, "step": 67030 }, { "epoch": 0.72, "learning_rate": 0.00019128883699811894, "loss": 0.0159, "step": 67040 }, { "epoch": 0.72, "learning_rate": 0.00019127262113251603, "loss": 0.0155, "step": 67050 }, { "epoch": 0.72, "learning_rate": 0.00019125640526691313, "loss": 0.0157, "step": 67060 }, { "epoch": 0.73, "learning_rate": 0.00019124018940131025, "loss": 0.0165, "step": 67070 }, { "epoch": 0.73, "learning_rate": 0.0001912239735357073, "loss": 0.0138, "step": 67080 }, { "epoch": 0.73, "learning_rate": 0.0001912077576701044, "loss": 0.0134, "step": 67090 }, { "epoch": 0.73, "learning_rate": 0.00019119154180450153, "loss": 0.0184, "step": 67100 }, { "epoch": 0.73, "learning_rate": 0.00019117532593889862, "loss": 0.0162, "step": 67110 }, { "epoch": 0.73, "learning_rate": 0.00019115911007329568, "loss": 0.0189, "step": 67120 }, { "epoch": 0.73, "learning_rate": 0.00019114289420769278, "loss": 0.0152, "step": 67130 }, { "epoch": 0.73, "learning_rate": 0.0001911266783420899, "loss": 0.0143, "step": 67140 }, { "epoch": 0.73, "learning_rate": 0.000191110462476487, "loss": 0.0153, "step": 67150 }, { "epoch": 0.73, "learning_rate": 0.00019109424661088405, "loss": 0.0182, "step": 67160 }, { "epoch": 0.73, "learning_rate": 0.00019107803074528117, "loss": 0.017, "step": 67170 }, { "epoch": 0.73, "learning_rate": 0.00019106181487967827, "loss": 0.0146, "step": 67180 }, { "epoch": 0.73, "learning_rate": 0.00019104559901407536, "loss": 0.0154, "step": 67190 }, { "epoch": 0.73, "learning_rate": 0.00019102938314847243, "loss": 0.0153, "step": 67200 }, { "epoch": 0.73, "learning_rate": 0.00019101316728286955, "loss": 0.013, "step": 67210 }, { "epoch": 0.73, "learning_rate": 0.00019099695141726664, "loss": 0.0153, "step": 67220 }, { "epoch": 0.73, "learning_rate": 0.00019098073555166373, "loss": 0.0154, "step": 67230 }, { "epoch": 0.73, "learning_rate": 0.00019096451968606082, "loss": 0.015, "step": 67240 }, { "epoch": 0.73, "learning_rate": 0.00019094830382045792, "loss": 0.0158, "step": 67250 }, { "epoch": 0.73, "learning_rate": 0.000190932087954855, "loss": 0.0118, "step": 67260 }, { "epoch": 0.73, "learning_rate": 0.00019091587208925213, "loss": 0.0206, "step": 67270 }, { "epoch": 0.73, "learning_rate": 0.0001908996562236492, "loss": 0.0147, "step": 67280 }, { "epoch": 0.73, "learning_rate": 0.0001908834403580463, "loss": 0.0145, "step": 67290 }, { "epoch": 0.73, "learning_rate": 0.0001908672244924434, "loss": 0.0148, "step": 67300 }, { "epoch": 0.73, "learning_rate": 0.0001908510086268405, "loss": 0.0145, "step": 67310 }, { "epoch": 0.73, "learning_rate": 0.00019083479276123757, "loss": 0.0178, "step": 67320 }, { "epoch": 0.73, "learning_rate": 0.00019081857689563466, "loss": 0.0169, "step": 67330 }, { "epoch": 0.73, "learning_rate": 0.00019080236103003178, "loss": 0.0206, "step": 67340 }, { "epoch": 0.73, "learning_rate": 0.00019078614516442887, "loss": 0.0179, "step": 67350 }, { "epoch": 0.73, "learning_rate": 0.00019076992929882594, "loss": 0.0126, "step": 67360 }, { "epoch": 0.73, "learning_rate": 0.00019075371343322306, "loss": 0.0157, "step": 67370 }, { "epoch": 0.73, "learning_rate": 0.00019073749756762015, "loss": 0.0165, "step": 67380 }, { "epoch": 0.73, "learning_rate": 0.00019072128170201724, "loss": 0.0197, "step": 67390 }, { "epoch": 0.73, "learning_rate": 0.0001907050658364143, "loss": 0.0141, "step": 67400 }, { "epoch": 0.73, "learning_rate": 0.00019068884997081143, "loss": 0.0165, "step": 67410 }, { "epoch": 0.73, "learning_rate": 0.00019067263410520852, "loss": 0.0137, "step": 67420 }, { "epoch": 0.73, "learning_rate": 0.0001906564182396056, "loss": 0.0124, "step": 67430 }, { "epoch": 0.73, "learning_rate": 0.0001906402023740027, "loss": 0.0127, "step": 67440 }, { "epoch": 0.73, "learning_rate": 0.0001906239865083998, "loss": 0.0129, "step": 67450 }, { "epoch": 0.73, "learning_rate": 0.0001906077706427969, "loss": 0.0145, "step": 67460 }, { "epoch": 0.73, "learning_rate": 0.000190591554777194, "loss": 0.0143, "step": 67470 }, { "epoch": 0.73, "learning_rate": 0.00019057533891159108, "loss": 0.0156, "step": 67480 }, { "epoch": 0.73, "learning_rate": 0.00019055912304598817, "loss": 0.0178, "step": 67490 }, { "epoch": 0.73, "learning_rate": 0.00019054290718038526, "loss": 0.0179, "step": 67500 }, { "epoch": 0.73, "learning_rate": 0.00019052669131478238, "loss": 0.0195, "step": 67510 }, { "epoch": 0.73, "learning_rate": 0.00019051047544917945, "loss": 0.0179, "step": 67520 }, { "epoch": 0.73, "learning_rate": 0.00019049425958357654, "loss": 0.0145, "step": 67530 }, { "epoch": 0.73, "learning_rate": 0.00019047804371797366, "loss": 0.0172, "step": 67540 }, { "epoch": 0.73, "learning_rate": 0.00019046182785237075, "loss": 0.0165, "step": 67550 }, { "epoch": 0.73, "learning_rate": 0.00019044561198676782, "loss": 0.0138, "step": 67560 }, { "epoch": 0.73, "learning_rate": 0.0001904293961211649, "loss": 0.0169, "step": 67570 }, { "epoch": 0.73, "learning_rate": 0.00019041318025556203, "loss": 0.0195, "step": 67580 }, { "epoch": 0.73, "learning_rate": 0.00019039696438995912, "loss": 0.0158, "step": 67590 }, { "epoch": 0.73, "learning_rate": 0.0001903807485243562, "loss": 0.0138, "step": 67600 }, { "epoch": 0.73, "learning_rate": 0.0001903645326587533, "loss": 0.0154, "step": 67610 }, { "epoch": 0.73, "learning_rate": 0.0001903483167931504, "loss": 0.013, "step": 67620 }, { "epoch": 0.73, "learning_rate": 0.0001903321009275475, "loss": 0.017, "step": 67630 }, { "epoch": 0.73, "learning_rate": 0.00019031588506194461, "loss": 0.016, "step": 67640 }, { "epoch": 0.73, "learning_rate": 0.00019029966919634168, "loss": 0.0171, "step": 67650 }, { "epoch": 0.73, "learning_rate": 0.00019028345333073877, "loss": 0.0184, "step": 67660 }, { "epoch": 0.73, "learning_rate": 0.0001902672374651359, "loss": 0.0199, "step": 67670 }, { "epoch": 0.73, "learning_rate": 0.00019025102159953299, "loss": 0.0159, "step": 67680 }, { "epoch": 0.73, "learning_rate": 0.00019023480573393005, "loss": 0.0193, "step": 67690 }, { "epoch": 0.73, "learning_rate": 0.00019021858986832714, "loss": 0.0164, "step": 67700 }, { "epoch": 0.73, "learning_rate": 0.00019020237400272426, "loss": 0.0215, "step": 67710 }, { "epoch": 0.73, "learning_rate": 0.00019018615813712136, "loss": 0.0159, "step": 67720 }, { "epoch": 0.73, "learning_rate": 0.00019016994227151842, "loss": 0.0193, "step": 67730 }, { "epoch": 0.73, "learning_rate": 0.00019015372640591554, "loss": 0.0282, "step": 67740 }, { "epoch": 0.73, "learning_rate": 0.00019013751054031263, "loss": 0.017, "step": 67750 }, { "epoch": 0.73, "learning_rate": 0.00019012129467470973, "loss": 0.0169, "step": 67760 }, { "epoch": 0.73, "learning_rate": 0.0001901050788091068, "loss": 0.0161, "step": 67770 }, { "epoch": 0.73, "learning_rate": 0.0001900888629435039, "loss": 0.0157, "step": 67780 }, { "epoch": 0.73, "learning_rate": 0.000190072647077901, "loss": 0.0194, "step": 67790 }, { "epoch": 0.73, "learning_rate": 0.0001900564312122981, "loss": 0.0154, "step": 67800 }, { "epoch": 0.73, "learning_rate": 0.0001900402153466952, "loss": 0.0203, "step": 67810 }, { "epoch": 0.73, "learning_rate": 0.00019002399948109228, "loss": 0.0143, "step": 67820 }, { "epoch": 0.73, "learning_rate": 0.00019000778361548938, "loss": 0.0202, "step": 67830 }, { "epoch": 0.73, "learning_rate": 0.0001899915677498865, "loss": 0.0171, "step": 67840 }, { "epoch": 0.73, "learning_rate": 0.00018997535188428356, "loss": 0.0192, "step": 67850 }, { "epoch": 0.73, "learning_rate": 0.00018995913601868065, "loss": 0.0136, "step": 67860 }, { "epoch": 0.73, "learning_rate": 0.00018994292015307775, "loss": 0.0155, "step": 67870 }, { "epoch": 0.73, "learning_rate": 0.00018992670428747487, "loss": 0.0196, "step": 67880 }, { "epoch": 0.73, "learning_rate": 0.00018991048842187193, "loss": 0.0155, "step": 67890 }, { "epoch": 0.73, "learning_rate": 0.00018989427255626903, "loss": 0.0185, "step": 67900 }, { "epoch": 0.73, "learning_rate": 0.00018987805669066615, "loss": 0.0146, "step": 67910 }, { "epoch": 0.73, "learning_rate": 0.00018986184082506324, "loss": 0.0135, "step": 67920 }, { "epoch": 0.73, "learning_rate": 0.0001898456249594603, "loss": 0.016, "step": 67930 }, { "epoch": 0.73, "learning_rate": 0.0001898294090938574, "loss": 0.017, "step": 67940 }, { "epoch": 0.73, "learning_rate": 0.00018981319322825452, "loss": 0.0159, "step": 67950 }, { "epoch": 0.73, "learning_rate": 0.0001897969773626516, "loss": 0.0192, "step": 67960 }, { "epoch": 0.73, "learning_rate": 0.00018978076149704868, "loss": 0.0138, "step": 67970 }, { "epoch": 0.73, "learning_rate": 0.0001897645456314458, "loss": 0.0149, "step": 67980 }, { "epoch": 0.74, "learning_rate": 0.0001897483297658429, "loss": 0.0155, "step": 67990 }, { "epoch": 0.74, "learning_rate": 0.00018973211390023998, "loss": 0.0143, "step": 68000 }, { "epoch": 0.74, "eval_cer": 0.921535620538638, "eval_loss": 0.010959140956401825, "eval_runtime": 121.0862, "eval_samples_per_second": 16.517, "eval_steps_per_second": 4.129, "step": 68000 }, { "epoch": 0.74, "learning_rate": 0.00018971589803463705, "loss": 0.0131, "step": 68010 }, { "epoch": 0.74, "learning_rate": 0.00018969968216903417, "loss": 0.0131, "step": 68020 }, { "epoch": 0.74, "learning_rate": 0.00018968346630343126, "loss": 0.0144, "step": 68030 }, { "epoch": 0.74, "learning_rate": 0.00018966725043782838, "loss": 0.0119, "step": 68040 }, { "epoch": 0.74, "learning_rate": 0.00018965103457222544, "loss": 0.0213, "step": 68050 }, { "epoch": 0.74, "learning_rate": 0.00018963481870662254, "loss": 0.0156, "step": 68060 }, { "epoch": 0.74, "learning_rate": 0.00018961860284101963, "loss": 0.0166, "step": 68070 }, { "epoch": 0.74, "learning_rate": 0.00018960238697541675, "loss": 0.0159, "step": 68080 }, { "epoch": 0.74, "learning_rate": 0.00018958617110981382, "loss": 0.0154, "step": 68090 }, { "epoch": 0.74, "learning_rate": 0.0001895699552442109, "loss": 0.0155, "step": 68100 }, { "epoch": 0.74, "learning_rate": 0.00018955373937860803, "loss": 0.0153, "step": 68110 }, { "epoch": 0.74, "learning_rate": 0.00018953752351300512, "loss": 0.0184, "step": 68120 }, { "epoch": 0.74, "learning_rate": 0.00018952130764740219, "loss": 0.012, "step": 68130 }, { "epoch": 0.74, "learning_rate": 0.00018950509178179928, "loss": 0.0139, "step": 68140 }, { "epoch": 0.74, "learning_rate": 0.0001894888759161964, "loss": 0.016, "step": 68150 }, { "epoch": 0.74, "learning_rate": 0.0001894726600505935, "loss": 0.0124, "step": 68160 }, { "epoch": 0.74, "learning_rate": 0.00018945644418499056, "loss": 0.0145, "step": 68170 }, { "epoch": 0.74, "learning_rate": 0.00018944022831938768, "loss": 0.0168, "step": 68180 }, { "epoch": 0.74, "learning_rate": 0.00018942401245378477, "loss": 0.0169, "step": 68190 }, { "epoch": 0.74, "learning_rate": 0.00018940779658818186, "loss": 0.0161, "step": 68200 }, { "epoch": 0.74, "learning_rate": 0.00018939158072257893, "loss": 0.0134, "step": 68210 }, { "epoch": 0.74, "learning_rate": 0.00018937536485697605, "loss": 0.0149, "step": 68220 }, { "epoch": 0.74, "learning_rate": 0.00018935914899137314, "loss": 0.0128, "step": 68230 }, { "epoch": 0.74, "learning_rate": 0.00018934293312577023, "loss": 0.0139, "step": 68240 }, { "epoch": 0.74, "learning_rate": 0.00018932671726016733, "loss": 0.0142, "step": 68250 }, { "epoch": 0.74, "learning_rate": 0.00018931050139456442, "loss": 0.0134, "step": 68260 }, { "epoch": 0.74, "learning_rate": 0.0001892942855289615, "loss": 0.0133, "step": 68270 }, { "epoch": 0.74, "learning_rate": 0.00018927806966335863, "loss": 0.0175, "step": 68280 }, { "epoch": 0.74, "learning_rate": 0.0001892618537977557, "loss": 0.0124, "step": 68290 }, { "epoch": 0.74, "learning_rate": 0.0001892456379321528, "loss": 0.0154, "step": 68300 }, { "epoch": 0.74, "learning_rate": 0.0001892294220665499, "loss": 0.0146, "step": 68310 }, { "epoch": 0.74, "learning_rate": 0.000189213206200947, "loss": 0.0145, "step": 68320 }, { "epoch": 0.74, "learning_rate": 0.00018919699033534407, "loss": 0.015, "step": 68330 }, { "epoch": 0.74, "learning_rate": 0.00018918077446974116, "loss": 0.0149, "step": 68340 }, { "epoch": 0.74, "learning_rate": 0.00018916455860413828, "loss": 0.0147, "step": 68350 }, { "epoch": 0.74, "learning_rate": 0.00018914834273853537, "loss": 0.0161, "step": 68360 }, { "epoch": 0.74, "learning_rate": 0.00018913212687293247, "loss": 0.0144, "step": 68370 }, { "epoch": 0.74, "learning_rate": 0.00018911591100732956, "loss": 0.0176, "step": 68380 }, { "epoch": 0.74, "learning_rate": 0.00018909969514172665, "loss": 0.0149, "step": 68390 }, { "epoch": 0.74, "learning_rate": 0.00018908347927612374, "loss": 0.0125, "step": 68400 }, { "epoch": 0.74, "learning_rate": 0.00018906726341052086, "loss": 0.0159, "step": 68410 }, { "epoch": 0.74, "learning_rate": 0.00018905104754491793, "loss": 0.0159, "step": 68420 }, { "epoch": 0.74, "learning_rate": 0.00018903483167931502, "loss": 0.0134, "step": 68430 }, { "epoch": 0.74, "learning_rate": 0.00018901861581371212, "loss": 0.0204, "step": 68440 }, { "epoch": 0.74, "learning_rate": 0.00018900239994810924, "loss": 0.0138, "step": 68450 }, { "epoch": 0.74, "learning_rate": 0.0001889861840825063, "loss": 0.0129, "step": 68460 }, { "epoch": 0.74, "learning_rate": 0.0001889699682169034, "loss": 0.0133, "step": 68470 }, { "epoch": 0.74, "learning_rate": 0.0001889537523513005, "loss": 0.0139, "step": 68480 }, { "epoch": 0.74, "learning_rate": 0.0001889375364856976, "loss": 0.0166, "step": 68490 }, { "epoch": 0.74, "learning_rate": 0.00018892132062009467, "loss": 0.018, "step": 68500 }, { "epoch": 0.74, "learning_rate": 0.00018890510475449176, "loss": 0.0143, "step": 68510 }, { "epoch": 0.74, "learning_rate": 0.00018888888888888888, "loss": 0.0188, "step": 68520 }, { "epoch": 0.74, "learning_rate": 0.00018887267302328598, "loss": 0.0129, "step": 68530 }, { "epoch": 0.74, "learning_rate": 0.00018885645715768304, "loss": 0.0172, "step": 68540 }, { "epoch": 0.74, "learning_rate": 0.00018884024129208016, "loss": 0.0146, "step": 68550 }, { "epoch": 0.74, "learning_rate": 0.00018882402542647726, "loss": 0.015, "step": 68560 }, { "epoch": 0.74, "learning_rate": 0.00018880780956087435, "loss": 0.0154, "step": 68570 }, { "epoch": 0.74, "learning_rate": 0.00018879159369527141, "loss": 0.0168, "step": 68580 }, { "epoch": 0.74, "learning_rate": 0.00018877537782966853, "loss": 0.0158, "step": 68590 }, { "epoch": 0.74, "learning_rate": 0.00018875916196406563, "loss": 0.0124, "step": 68600 }, { "epoch": 0.74, "learning_rate": 0.00018874294609846275, "loss": 0.0147, "step": 68610 }, { "epoch": 0.74, "learning_rate": 0.0001887267302328598, "loss": 0.0176, "step": 68620 }, { "epoch": 0.74, "learning_rate": 0.0001887105143672569, "loss": 0.0145, "step": 68630 }, { "epoch": 0.74, "learning_rate": 0.000188694298501654, "loss": 0.0131, "step": 68640 }, { "epoch": 0.74, "learning_rate": 0.00018867808263605112, "loss": 0.0149, "step": 68650 }, { "epoch": 0.74, "learning_rate": 0.00018866186677044818, "loss": 0.0145, "step": 68660 }, { "epoch": 0.74, "learning_rate": 0.00018864565090484528, "loss": 0.0148, "step": 68670 }, { "epoch": 0.74, "learning_rate": 0.0001886294350392424, "loss": 0.0196, "step": 68680 }, { "epoch": 0.74, "learning_rate": 0.0001886132191736395, "loss": 0.0134, "step": 68690 }, { "epoch": 0.74, "learning_rate": 0.00018859700330803655, "loss": 0.0159, "step": 68700 }, { "epoch": 0.74, "learning_rate": 0.00018858078744243365, "loss": 0.0147, "step": 68710 }, { "epoch": 0.74, "learning_rate": 0.00018856457157683077, "loss": 0.0143, "step": 68720 }, { "epoch": 0.74, "learning_rate": 0.00018854835571122786, "loss": 0.0169, "step": 68730 }, { "epoch": 0.74, "learning_rate": 0.00018853213984562492, "loss": 0.0155, "step": 68740 }, { "epoch": 0.74, "learning_rate": 0.00018851592398002204, "loss": 0.0146, "step": 68750 }, { "epoch": 0.74, "learning_rate": 0.00018849970811441914, "loss": 0.016, "step": 68760 }, { "epoch": 0.74, "learning_rate": 0.00018848349224881623, "loss": 0.0147, "step": 68770 }, { "epoch": 0.74, "learning_rate": 0.0001884672763832133, "loss": 0.0133, "step": 68780 }, { "epoch": 0.74, "learning_rate": 0.00018845106051761042, "loss": 0.0172, "step": 68790 }, { "epoch": 0.74, "learning_rate": 0.0001884348446520075, "loss": 0.0179, "step": 68800 }, { "epoch": 0.74, "learning_rate": 0.0001884186287864046, "loss": 0.0138, "step": 68810 }, { "epoch": 0.74, "learning_rate": 0.0001884024129208017, "loss": 0.0183, "step": 68820 }, { "epoch": 0.74, "learning_rate": 0.0001883861970551988, "loss": 0.0143, "step": 68830 }, { "epoch": 0.74, "learning_rate": 0.00018836998118959588, "loss": 0.0163, "step": 68840 }, { "epoch": 0.74, "learning_rate": 0.000188353765323993, "loss": 0.0145, "step": 68850 }, { "epoch": 0.74, "learning_rate": 0.00018833754945839006, "loss": 0.0148, "step": 68860 }, { "epoch": 0.74, "learning_rate": 0.00018832133359278716, "loss": 0.0174, "step": 68870 }, { "epoch": 0.74, "learning_rate": 0.00018830511772718425, "loss": 0.0151, "step": 68880 }, { "epoch": 0.74, "learning_rate": 0.00018828890186158137, "loss": 0.014, "step": 68890 }, { "epoch": 0.74, "learning_rate": 0.00018827268599597844, "loss": 0.0133, "step": 68900 }, { "epoch": 0.74, "learning_rate": 0.00018825647013037553, "loss": 0.0162, "step": 68910 }, { "epoch": 0.75, "learning_rate": 0.00018824025426477265, "loss": 0.0163, "step": 68920 }, { "epoch": 0.75, "learning_rate": 0.00018822403839916974, "loss": 0.014, "step": 68930 }, { "epoch": 0.75, "learning_rate": 0.0001882078225335668, "loss": 0.0164, "step": 68940 }, { "epoch": 0.75, "learning_rate": 0.0001881916066679639, "loss": 0.0132, "step": 68950 }, { "epoch": 0.75, "learning_rate": 0.00018817539080236102, "loss": 0.0145, "step": 68960 }, { "epoch": 0.75, "learning_rate": 0.0001881591749367581, "loss": 0.0135, "step": 68970 }, { "epoch": 0.75, "learning_rate": 0.00018814295907115518, "loss": 0.0165, "step": 68980 }, { "epoch": 0.75, "learning_rate": 0.0001881267432055523, "loss": 0.0175, "step": 68990 }, { "epoch": 0.75, "learning_rate": 0.0001881105273399494, "loss": 0.0168, "step": 69000 }, { "epoch": 0.75, "eval_cer": 0.921567758848024, "eval_loss": 0.010564006865024567, "eval_runtime": 121.2365, "eval_samples_per_second": 16.497, "eval_steps_per_second": 4.124, "step": 69000 }, { "epoch": 0.75, "learning_rate": 0.00018809431147434648, "loss": 0.014, "step": 69010 }, { "epoch": 0.75, "learning_rate": 0.00018807809560874355, "loss": 0.0152, "step": 69020 }, { "epoch": 0.75, "learning_rate": 0.00018806187974314067, "loss": 0.0165, "step": 69030 }, { "epoch": 0.75, "learning_rate": 0.00018804566387753776, "loss": 0.0118, "step": 69040 }, { "epoch": 0.75, "learning_rate": 0.00018802944801193488, "loss": 0.0188, "step": 69050 }, { "epoch": 0.75, "learning_rate": 0.00018801323214633197, "loss": 0.0162, "step": 69060 }, { "epoch": 0.75, "learning_rate": 0.00018799701628072904, "loss": 0.0165, "step": 69070 }, { "epoch": 0.75, "learning_rate": 0.00018798080041512613, "loss": 0.0153, "step": 69080 }, { "epoch": 0.75, "learning_rate": 0.00018796458454952325, "loss": 0.0142, "step": 69090 }, { "epoch": 0.75, "learning_rate": 0.00018794836868392034, "loss": 0.0134, "step": 69100 }, { "epoch": 0.75, "learning_rate": 0.0001879321528183174, "loss": 0.0155, "step": 69110 }, { "epoch": 0.75, "learning_rate": 0.00018791593695271453, "loss": 0.0144, "step": 69120 }, { "epoch": 0.75, "learning_rate": 0.00018789972108711162, "loss": 0.0113, "step": 69130 }, { "epoch": 0.75, "learning_rate": 0.00018788350522150872, "loss": 0.0164, "step": 69140 }, { "epoch": 0.75, "learning_rate": 0.00018786728935590578, "loss": 0.0113, "step": 69150 }, { "epoch": 0.75, "learning_rate": 0.0001878510734903029, "loss": 0.0125, "step": 69160 }, { "epoch": 0.75, "learning_rate": 0.0001878348576247, "loss": 0.0128, "step": 69170 }, { "epoch": 0.75, "learning_rate": 0.0001878186417590971, "loss": 0.0124, "step": 69180 }, { "epoch": 0.75, "learning_rate": 0.00018780242589349418, "loss": 0.0157, "step": 69190 }, { "epoch": 0.75, "learning_rate": 0.00018778621002789127, "loss": 0.0153, "step": 69200 }, { "epoch": 0.75, "learning_rate": 0.00018776999416228837, "loss": 0.0152, "step": 69210 }, { "epoch": 0.75, "learning_rate": 0.00018775377829668548, "loss": 0.0146, "step": 69220 }, { "epoch": 0.75, "learning_rate": 0.00018773756243108255, "loss": 0.0131, "step": 69230 }, { "epoch": 0.75, "learning_rate": 0.00018772134656547964, "loss": 0.0138, "step": 69240 }, { "epoch": 0.75, "learning_rate": 0.00018770513069987674, "loss": 0.0128, "step": 69250 }, { "epoch": 0.75, "learning_rate": 0.00018768891483427386, "loss": 0.0144, "step": 69260 }, { "epoch": 0.75, "learning_rate": 0.00018767269896867092, "loss": 0.0141, "step": 69270 }, { "epoch": 0.75, "learning_rate": 0.00018765648310306801, "loss": 0.0178, "step": 69280 }, { "epoch": 0.75, "learning_rate": 0.00018764026723746513, "loss": 0.0162, "step": 69290 }, { "epoch": 0.75, "learning_rate": 0.00018762405137186223, "loss": 0.0154, "step": 69300 }, { "epoch": 0.75, "learning_rate": 0.0001876078355062593, "loss": 0.0121, "step": 69310 }, { "epoch": 0.75, "learning_rate": 0.00018759161964065639, "loss": 0.0127, "step": 69320 }, { "epoch": 0.75, "learning_rate": 0.0001875754037750535, "loss": 0.0154, "step": 69330 }, { "epoch": 0.75, "learning_rate": 0.0001875591879094506, "loss": 0.0131, "step": 69340 }, { "epoch": 0.75, "learning_rate": 0.00018754297204384766, "loss": 0.0162, "step": 69350 }, { "epoch": 0.75, "learning_rate": 0.00018752675617824478, "loss": 0.0186, "step": 69360 }, { "epoch": 0.75, "learning_rate": 0.00018751054031264188, "loss": 0.0149, "step": 69370 }, { "epoch": 0.75, "learning_rate": 0.00018749432444703897, "loss": 0.0158, "step": 69380 }, { "epoch": 0.75, "learning_rate": 0.00018747810858143606, "loss": 0.0131, "step": 69390 }, { "epoch": 0.75, "learning_rate": 0.00018746189271583315, "loss": 0.0149, "step": 69400 }, { "epoch": 0.75, "learning_rate": 0.00018744567685023025, "loss": 0.0152, "step": 69410 }, { "epoch": 0.75, "learning_rate": 0.00018742946098462737, "loss": 0.0161, "step": 69420 }, { "epoch": 0.75, "learning_rate": 0.00018741324511902443, "loss": 0.0124, "step": 69430 }, { "epoch": 0.75, "learning_rate": 0.00018739702925342153, "loss": 0.0153, "step": 69440 }, { "epoch": 0.75, "learning_rate": 0.00018738081338781862, "loss": 0.0135, "step": 69450 }, { "epoch": 0.75, "learning_rate": 0.00018736459752221574, "loss": 0.0211, "step": 69460 }, { "epoch": 0.75, "learning_rate": 0.0001873483816566128, "loss": 0.016, "step": 69470 }, { "epoch": 0.75, "learning_rate": 0.0001873321657910099, "loss": 0.0138, "step": 69480 }, { "epoch": 0.75, "learning_rate": 0.00018731594992540702, "loss": 0.0147, "step": 69490 }, { "epoch": 0.75, "learning_rate": 0.0001872997340598041, "loss": 0.0143, "step": 69500 }, { "epoch": 0.75, "learning_rate": 0.00018728351819420117, "loss": 0.0178, "step": 69510 }, { "epoch": 0.75, "learning_rate": 0.00018726730232859827, "loss": 0.0198, "step": 69520 }, { "epoch": 0.75, "learning_rate": 0.0001872510864629954, "loss": 0.0145, "step": 69530 }, { "epoch": 0.75, "learning_rate": 0.00018723487059739248, "loss": 0.0153, "step": 69540 }, { "epoch": 0.75, "learning_rate": 0.00018721865473178955, "loss": 0.0141, "step": 69550 }, { "epoch": 0.75, "learning_rate": 0.00018720243886618667, "loss": 0.0143, "step": 69560 }, { "epoch": 0.75, "learning_rate": 0.00018718622300058376, "loss": 0.0143, "step": 69570 }, { "epoch": 0.75, "learning_rate": 0.00018717000713498085, "loss": 0.0164, "step": 69580 }, { "epoch": 0.75, "learning_rate": 0.00018715379126937792, "loss": 0.0146, "step": 69590 }, { "epoch": 0.75, "learning_rate": 0.00018713757540377504, "loss": 0.0147, "step": 69600 }, { "epoch": 0.75, "learning_rate": 0.00018712135953817213, "loss": 0.0154, "step": 69610 }, { "epoch": 0.75, "learning_rate": 0.00018710514367256925, "loss": 0.0123, "step": 69620 }, { "epoch": 0.75, "learning_rate": 0.00018708892780696631, "loss": 0.0155, "step": 69630 }, { "epoch": 0.75, "learning_rate": 0.0001870727119413634, "loss": 0.0111, "step": 69640 }, { "epoch": 0.75, "learning_rate": 0.0001870564960757605, "loss": 0.0142, "step": 69650 }, { "epoch": 0.75, "learning_rate": 0.00018704028021015762, "loss": 0.0131, "step": 69660 }, { "epoch": 0.75, "learning_rate": 0.00018702406434455469, "loss": 0.0162, "step": 69670 }, { "epoch": 0.75, "learning_rate": 0.00018700784847895178, "loss": 0.0131, "step": 69680 }, { "epoch": 0.75, "learning_rate": 0.0001869916326133489, "loss": 0.0138, "step": 69690 }, { "epoch": 0.75, "learning_rate": 0.000186975416747746, "loss": 0.0131, "step": 69700 }, { "epoch": 0.75, "learning_rate": 0.00018695920088214306, "loss": 0.0117, "step": 69710 }, { "epoch": 0.75, "learning_rate": 0.00018694298501654015, "loss": 0.0152, "step": 69720 }, { "epoch": 0.75, "learning_rate": 0.00018692676915093727, "loss": 0.0207, "step": 69730 }, { "epoch": 0.75, "learning_rate": 0.00018691055328533436, "loss": 0.0164, "step": 69740 }, { "epoch": 0.75, "learning_rate": 0.00018689433741973143, "loss": 0.0151, "step": 69750 }, { "epoch": 0.75, "learning_rate": 0.00018687812155412855, "loss": 0.0144, "step": 69760 }, { "epoch": 0.75, "learning_rate": 0.00018686190568852564, "loss": 0.0136, "step": 69770 }, { "epoch": 0.75, "learning_rate": 0.00018684568982292273, "loss": 0.0154, "step": 69780 }, { "epoch": 0.75, "learning_rate": 0.00018682947395731985, "loss": 0.016, "step": 69790 }, { "epoch": 0.75, "learning_rate": 0.00018681325809171692, "loss": 0.0153, "step": 69800 }, { "epoch": 0.75, "learning_rate": 0.000186797042226114, "loss": 0.0161, "step": 69810 }, { "epoch": 0.75, "learning_rate": 0.0001867808263605111, "loss": 0.0138, "step": 69820 }, { "epoch": 0.75, "learning_rate": 0.00018676461049490822, "loss": 0.0147, "step": 69830 }, { "epoch": 0.76, "learning_rate": 0.0001867483946293053, "loss": 0.0126, "step": 69840 }, { "epoch": 0.76, "learning_rate": 0.00018673217876370238, "loss": 0.015, "step": 69850 }, { "epoch": 0.76, "learning_rate": 0.0001867159628980995, "loss": 0.0157, "step": 69860 }, { "epoch": 0.76, "learning_rate": 0.0001866997470324966, "loss": 0.0169, "step": 69870 }, { "epoch": 0.76, "learning_rate": 0.00018668353116689366, "loss": 0.0154, "step": 69880 }, { "epoch": 0.76, "learning_rate": 0.00018666731530129075, "loss": 0.0149, "step": 69890 }, { "epoch": 0.76, "learning_rate": 0.00018665109943568787, "loss": 0.0166, "step": 69900 }, { "epoch": 0.76, "learning_rate": 0.00018663488357008497, "loss": 0.0135, "step": 69910 }, { "epoch": 0.76, "learning_rate": 0.00018661866770448203, "loss": 0.0141, "step": 69920 }, { "epoch": 0.76, "learning_rate": 0.00018660245183887915, "loss": 0.0171, "step": 69930 }, { "epoch": 0.76, "learning_rate": 0.00018658623597327624, "loss": 0.0174, "step": 69940 }, { "epoch": 0.76, "learning_rate": 0.00018657002010767334, "loss": 0.0164, "step": 69950 }, { "epoch": 0.76, "learning_rate": 0.0001865538042420704, "loss": 0.0143, "step": 69960 }, { "epoch": 0.76, "learning_rate": 0.00018653758837646752, "loss": 0.0146, "step": 69970 }, { "epoch": 0.76, "learning_rate": 0.00018652137251086461, "loss": 0.0164, "step": 69980 }, { "epoch": 0.76, "learning_rate": 0.00018650515664526173, "loss": 0.0153, "step": 69990 }, { "epoch": 0.76, "learning_rate": 0.0001864889407796588, "loss": 0.0136, "step": 70000 }, { "epoch": 0.76, "eval_cer": 0.9215364891415945, "eval_loss": 0.010723001323640347, "eval_runtime": 121.1995, "eval_samples_per_second": 16.502, "eval_steps_per_second": 4.125, "step": 70000 }, { "epoch": 0.76, "learning_rate": 0.0001864727249140559, "loss": 0.0151, "step": 70010 }, { "epoch": 0.76, "learning_rate": 0.00018645650904845299, "loss": 0.0163, "step": 70020 }, { "epoch": 0.76, "learning_rate": 0.0001864402931828501, "loss": 0.0143, "step": 70030 }, { "epoch": 0.76, "learning_rate": 0.00018642407731724717, "loss": 0.0143, "step": 70040 }, { "epoch": 0.76, "learning_rate": 0.00018640786145164426, "loss": 0.0166, "step": 70050 }, { "epoch": 0.76, "learning_rate": 0.00018639164558604138, "loss": 0.0174, "step": 70060 }, { "epoch": 0.76, "learning_rate": 0.00018637542972043848, "loss": 0.0161, "step": 70070 }, { "epoch": 0.76, "learning_rate": 0.00018635921385483554, "loss": 0.0142, "step": 70080 }, { "epoch": 0.76, "learning_rate": 0.00018634299798923263, "loss": 0.0147, "step": 70090 }, { "epoch": 0.76, "learning_rate": 0.00018632678212362975, "loss": 0.0124, "step": 70100 }, { "epoch": 0.76, "learning_rate": 0.00018631056625802685, "loss": 0.0161, "step": 70110 }, { "epoch": 0.76, "learning_rate": 0.0001862943503924239, "loss": 0.0172, "step": 70120 }, { "epoch": 0.76, "learning_rate": 0.00018627813452682103, "loss": 0.014, "step": 70130 }, { "epoch": 0.76, "learning_rate": 0.00018626191866121813, "loss": 0.0158, "step": 70140 }, { "epoch": 0.76, "learning_rate": 0.00018624570279561522, "loss": 0.0157, "step": 70150 }, { "epoch": 0.76, "learning_rate": 0.00018622948693001228, "loss": 0.0167, "step": 70160 }, { "epoch": 0.76, "learning_rate": 0.0001862132710644094, "loss": 0.017, "step": 70170 }, { "epoch": 0.76, "learning_rate": 0.0001861970551988065, "loss": 0.0134, "step": 70180 }, { "epoch": 0.76, "learning_rate": 0.0001861808393332036, "loss": 0.0149, "step": 70190 }, { "epoch": 0.76, "learning_rate": 0.00018616462346760068, "loss": 0.0189, "step": 70200 }, { "epoch": 0.76, "learning_rate": 0.00018614840760199777, "loss": 0.0172, "step": 70210 }, { "epoch": 0.76, "learning_rate": 0.00018613219173639487, "loss": 0.0142, "step": 70220 }, { "epoch": 0.76, "learning_rate": 0.000186115975870792, "loss": 0.0136, "step": 70230 }, { "epoch": 0.76, "learning_rate": 0.00018609976000518905, "loss": 0.0146, "step": 70240 }, { "epoch": 0.76, "learning_rate": 0.00018608354413958615, "loss": 0.0131, "step": 70250 }, { "epoch": 0.76, "learning_rate": 0.00018606732827398324, "loss": 0.0163, "step": 70260 }, { "epoch": 0.76, "learning_rate": 0.00018605111240838036, "loss": 0.0161, "step": 70270 }, { "epoch": 0.76, "learning_rate": 0.00018603489654277742, "loss": 0.0162, "step": 70280 }, { "epoch": 0.76, "learning_rate": 0.00018601868067717452, "loss": 0.0137, "step": 70290 }, { "epoch": 0.76, "learning_rate": 0.00018600246481157164, "loss": 0.0141, "step": 70300 }, { "epoch": 0.76, "learning_rate": 0.00018598624894596873, "loss": 0.0172, "step": 70310 }, { "epoch": 0.76, "learning_rate": 0.0001859700330803658, "loss": 0.0173, "step": 70320 }, { "epoch": 0.76, "learning_rate": 0.0001859538172147629, "loss": 0.0149, "step": 70330 }, { "epoch": 0.76, "learning_rate": 0.00018593760134916, "loss": 0.0136, "step": 70340 }, { "epoch": 0.76, "learning_rate": 0.0001859213854835571, "loss": 0.0139, "step": 70350 }, { "epoch": 0.76, "learning_rate": 0.00018590516961795417, "loss": 0.0133, "step": 70360 }, { "epoch": 0.76, "learning_rate": 0.00018588895375235129, "loss": 0.0153, "step": 70370 }, { "epoch": 0.76, "learning_rate": 0.00018587273788674838, "loss": 0.0122, "step": 70380 }, { "epoch": 0.76, "learning_rate": 0.00018585652202114547, "loss": 0.0164, "step": 70390 }, { "epoch": 0.76, "learning_rate": 0.00018584030615554256, "loss": 0.016, "step": 70400 }, { "epoch": 0.76, "learning_rate": 0.00018582409028993966, "loss": 0.0158, "step": 70410 }, { "epoch": 0.76, "learning_rate": 0.00018580787442433675, "loss": 0.0146, "step": 70420 }, { "epoch": 0.76, "learning_rate": 0.00018579165855873387, "loss": 0.0167, "step": 70430 }, { "epoch": 0.76, "learning_rate": 0.00018577544269313094, "loss": 0.0135, "step": 70440 }, { "epoch": 0.76, "learning_rate": 0.00018575922682752803, "loss": 0.0166, "step": 70450 }, { "epoch": 0.76, "learning_rate": 0.00018574301096192512, "loss": 0.0146, "step": 70460 }, { "epoch": 0.76, "learning_rate": 0.00018572679509632224, "loss": 0.0144, "step": 70470 }, { "epoch": 0.76, "learning_rate": 0.0001857105792307193, "loss": 0.0134, "step": 70480 }, { "epoch": 0.76, "learning_rate": 0.0001856943633651164, "loss": 0.0162, "step": 70490 }, { "epoch": 0.76, "learning_rate": 0.00018567814749951352, "loss": 0.0135, "step": 70500 }, { "epoch": 0.76, "learning_rate": 0.0001856619316339106, "loss": 0.0173, "step": 70510 }, { "epoch": 0.76, "learning_rate": 0.0001856457157683077, "loss": 0.0157, "step": 70520 }, { "epoch": 0.76, "learning_rate": 0.00018562949990270477, "loss": 0.013, "step": 70530 }, { "epoch": 0.76, "learning_rate": 0.0001856132840371019, "loss": 0.0154, "step": 70540 }, { "epoch": 0.76, "learning_rate": 0.00018559706817149898, "loss": 0.0152, "step": 70550 }, { "epoch": 0.76, "learning_rate": 0.00018558085230589608, "loss": 0.0151, "step": 70560 }, { "epoch": 0.76, "learning_rate": 0.00018556463644029317, "loss": 0.0126, "step": 70570 }, { "epoch": 0.76, "learning_rate": 0.00018554842057469026, "loss": 0.0146, "step": 70580 }, { "epoch": 0.76, "learning_rate": 0.00018553220470908735, "loss": 0.0128, "step": 70590 }, { "epoch": 0.76, "learning_rate": 0.00018551598884348447, "loss": 0.0129, "step": 70600 }, { "epoch": 0.76, "learning_rate": 0.00018549977297788154, "loss": 0.0156, "step": 70610 }, { "epoch": 0.76, "learning_rate": 0.00018548355711227863, "loss": 0.0152, "step": 70620 }, { "epoch": 0.76, "learning_rate": 0.00018546734124667575, "loss": 0.0116, "step": 70630 }, { "epoch": 0.76, "learning_rate": 0.00018545112538107284, "loss": 0.0165, "step": 70640 }, { "epoch": 0.76, "learning_rate": 0.0001854349095154699, "loss": 0.012, "step": 70650 }, { "epoch": 0.76, "learning_rate": 0.000185418693649867, "loss": 0.0157, "step": 70660 }, { "epoch": 0.76, "learning_rate": 0.00018540247778426412, "loss": 0.0145, "step": 70670 }, { "epoch": 0.76, "learning_rate": 0.00018538626191866122, "loss": 0.0139, "step": 70680 }, { "epoch": 0.76, "learning_rate": 0.00018537004605305828, "loss": 0.0147, "step": 70690 }, { "epoch": 0.76, "learning_rate": 0.0001853538301874554, "loss": 0.0161, "step": 70700 }, { "epoch": 0.76, "learning_rate": 0.0001853376143218525, "loss": 0.0144, "step": 70710 }, { "epoch": 0.76, "learning_rate": 0.00018532139845624959, "loss": 0.016, "step": 70720 }, { "epoch": 0.76, "learning_rate": 0.00018530518259064665, "loss": 0.0107, "step": 70730 }, { "epoch": 0.76, "learning_rate": 0.00018528896672504377, "loss": 0.0158, "step": 70740 }, { "epoch": 0.76, "learning_rate": 0.00018527275085944086, "loss": 0.0131, "step": 70750 }, { "epoch": 0.76, "learning_rate": 0.00018525653499383796, "loss": 0.0134, "step": 70760 }, { "epoch": 0.77, "learning_rate": 0.00018524031912823505, "loss": 0.0125, "step": 70770 }, { "epoch": 0.77, "learning_rate": 0.00018522410326263214, "loss": 0.0151, "step": 70780 }, { "epoch": 0.77, "learning_rate": 0.00018520788739702924, "loss": 0.0137, "step": 70790 }, { "epoch": 0.77, "learning_rate": 0.00018519167153142636, "loss": 0.0172, "step": 70800 }, { "epoch": 0.77, "learning_rate": 0.00018517545566582342, "loss": 0.0178, "step": 70810 }, { "epoch": 0.77, "learning_rate": 0.0001851592398002205, "loss": 0.0118, "step": 70820 }, { "epoch": 0.77, "learning_rate": 0.0001851430239346176, "loss": 0.0157, "step": 70830 }, { "epoch": 0.77, "learning_rate": 0.00018512680806901473, "loss": 0.0154, "step": 70840 }, { "epoch": 0.77, "learning_rate": 0.0001851105922034118, "loss": 0.0144, "step": 70850 }, { "epoch": 0.77, "learning_rate": 0.00018509437633780888, "loss": 0.0143, "step": 70860 }, { "epoch": 0.77, "learning_rate": 0.000185078160472206, "loss": 0.0146, "step": 70870 }, { "epoch": 0.77, "learning_rate": 0.0001850619446066031, "loss": 0.0169, "step": 70880 }, { "epoch": 0.77, "learning_rate": 0.00018504572874100016, "loss": 0.0135, "step": 70890 }, { "epoch": 0.77, "learning_rate": 0.00018502951287539726, "loss": 0.0157, "step": 70900 }, { "epoch": 0.77, "learning_rate": 0.00018501329700979438, "loss": 0.0137, "step": 70910 }, { "epoch": 0.77, "learning_rate": 0.00018499708114419147, "loss": 0.0139, "step": 70920 }, { "epoch": 0.77, "learning_rate": 0.00018498086527858853, "loss": 0.0151, "step": 70930 }, { "epoch": 0.77, "learning_rate": 0.00018496464941298565, "loss": 0.013, "step": 70940 }, { "epoch": 0.77, "learning_rate": 0.00018494843354738275, "loss": 0.0191, "step": 70950 }, { "epoch": 0.77, "learning_rate": 0.00018493221768177984, "loss": 0.0166, "step": 70960 }, { "epoch": 0.77, "learning_rate": 0.0001849160018161769, "loss": 0.0152, "step": 70970 }, { "epoch": 0.77, "learning_rate": 0.00018489978595057402, "loss": 0.0141, "step": 70980 }, { "epoch": 0.77, "learning_rate": 0.00018488357008497112, "loss": 0.0133, "step": 70990 }, { "epoch": 0.77, "learning_rate": 0.00018486735421936824, "loss": 0.0141, "step": 71000 }, { "epoch": 0.77, "eval_cer": 0.9215330147297689, "eval_loss": 0.010413131676614285, "eval_runtime": 121.2759, "eval_samples_per_second": 16.491, "eval_steps_per_second": 4.123, "step": 71000 }, { "epoch": 0.77, "learning_rate": 0.0001848511383537653, "loss": 0.0142, "step": 71010 }, { "epoch": 0.77, "learning_rate": 0.0001848349224881624, "loss": 0.0147, "step": 71020 }, { "epoch": 0.77, "learning_rate": 0.0001848187066225595, "loss": 0.0153, "step": 71030 }, { "epoch": 0.77, "learning_rate": 0.0001848024907569566, "loss": 0.0136, "step": 71040 }, { "epoch": 0.77, "learning_rate": 0.00018478627489135367, "loss": 0.0131, "step": 71050 }, { "epoch": 0.77, "learning_rate": 0.00018477005902575077, "loss": 0.0151, "step": 71060 }, { "epoch": 0.77, "learning_rate": 0.00018475384316014789, "loss": 0.0162, "step": 71070 }, { "epoch": 0.77, "learning_rate": 0.00018473762729454498, "loss": 0.0158, "step": 71080 }, { "epoch": 0.77, "learning_rate": 0.00018472141142894204, "loss": 0.013, "step": 71090 }, { "epoch": 0.77, "learning_rate": 0.00018470519556333914, "loss": 0.0165, "step": 71100 }, { "epoch": 0.77, "learning_rate": 0.00018468897969773626, "loss": 0.0152, "step": 71110 }, { "epoch": 0.77, "learning_rate": 0.00018467276383213335, "loss": 0.0134, "step": 71120 }, { "epoch": 0.77, "learning_rate": 0.00018465654796653042, "loss": 0.0163, "step": 71130 }, { "epoch": 0.77, "learning_rate": 0.00018464033210092754, "loss": 0.0142, "step": 71140 }, { "epoch": 0.77, "learning_rate": 0.00018462411623532463, "loss": 0.0123, "step": 71150 }, { "epoch": 0.77, "learning_rate": 0.00018460790036972172, "loss": 0.0162, "step": 71160 }, { "epoch": 0.77, "learning_rate": 0.0001845916845041188, "loss": 0.0157, "step": 71170 }, { "epoch": 0.77, "learning_rate": 0.0001845754686385159, "loss": 0.0128, "step": 71180 }, { "epoch": 0.77, "learning_rate": 0.000184559252772913, "loss": 0.0132, "step": 71190 }, { "epoch": 0.77, "learning_rate": 0.0001845430369073101, "loss": 0.017, "step": 71200 }, { "epoch": 0.77, "learning_rate": 0.00018452682104170718, "loss": 0.0152, "step": 71210 }, { "epoch": 0.77, "learning_rate": 0.00018451060517610428, "loss": 0.0138, "step": 71220 }, { "epoch": 0.77, "learning_rate": 0.00018449438931050137, "loss": 0.0169, "step": 71230 }, { "epoch": 0.77, "learning_rate": 0.0001844781734448985, "loss": 0.0155, "step": 71240 }, { "epoch": 0.77, "learning_rate": 0.00018446195757929558, "loss": 0.014, "step": 71250 }, { "epoch": 0.77, "learning_rate": 0.00018444574171369265, "loss": 0.014, "step": 71260 }, { "epoch": 0.77, "learning_rate": 0.00018442952584808974, "loss": 0.0162, "step": 71270 }, { "epoch": 0.77, "learning_rate": 0.00018441330998248686, "loss": 0.0115, "step": 71280 }, { "epoch": 0.77, "learning_rate": 0.00018439709411688395, "loss": 0.0136, "step": 71290 }, { "epoch": 0.77, "learning_rate": 0.00018438087825128102, "loss": 0.014, "step": 71300 }, { "epoch": 0.77, "learning_rate": 0.00018436466238567814, "loss": 0.0166, "step": 71310 }, { "epoch": 0.77, "learning_rate": 0.00018434844652007523, "loss": 0.0154, "step": 71320 }, { "epoch": 0.77, "learning_rate": 0.00018433223065447232, "loss": 0.0149, "step": 71330 }, { "epoch": 0.77, "learning_rate": 0.0001843160147888694, "loss": 0.0158, "step": 71340 }, { "epoch": 0.77, "learning_rate": 0.0001842997989232665, "loss": 0.0126, "step": 71350 }, { "epoch": 0.77, "learning_rate": 0.0001842835830576636, "loss": 0.0132, "step": 71360 }, { "epoch": 0.77, "learning_rate": 0.00018426736719206072, "loss": 0.0141, "step": 71370 }, { "epoch": 0.77, "learning_rate": 0.0001842511513264578, "loss": 0.0122, "step": 71380 }, { "epoch": 0.77, "learning_rate": 0.00018423493546085488, "loss": 0.0127, "step": 71390 }, { "epoch": 0.77, "learning_rate": 0.00018421871959525197, "loss": 0.0128, "step": 71400 }, { "epoch": 0.77, "learning_rate": 0.0001842025037296491, "loss": 0.0137, "step": 71410 }, { "epoch": 0.77, "learning_rate": 0.00018418628786404616, "loss": 0.0122, "step": 71420 }, { "epoch": 0.77, "learning_rate": 0.00018417007199844325, "loss": 0.0137, "step": 71430 }, { "epoch": 0.77, "learning_rate": 0.00018415385613284037, "loss": 0.0138, "step": 71440 }, { "epoch": 0.77, "learning_rate": 0.00018413764026723746, "loss": 0.0138, "step": 71450 }, { "epoch": 0.77, "learning_rate": 0.00018412142440163453, "loss": 0.0157, "step": 71460 }, { "epoch": 0.77, "learning_rate": 0.00018410520853603162, "loss": 0.0131, "step": 71470 }, { "epoch": 0.77, "learning_rate": 0.00018408899267042874, "loss": 0.0154, "step": 71480 }, { "epoch": 0.77, "learning_rate": 0.00018407277680482584, "loss": 0.0179, "step": 71490 }, { "epoch": 0.77, "learning_rate": 0.0001840565609392229, "loss": 0.0142, "step": 71500 }, { "epoch": 0.77, "learning_rate": 0.00018404034507362002, "loss": 0.0146, "step": 71510 }, { "epoch": 0.77, "learning_rate": 0.00018402412920801711, "loss": 0.0152, "step": 71520 }, { "epoch": 0.77, "learning_rate": 0.0001840079133424142, "loss": 0.0139, "step": 71530 }, { "epoch": 0.77, "learning_rate": 0.00018399169747681127, "loss": 0.0168, "step": 71540 }, { "epoch": 0.77, "learning_rate": 0.0001839754816112084, "loss": 0.0175, "step": 71550 }, { "epoch": 0.77, "learning_rate": 0.00018395926574560548, "loss": 0.0143, "step": 71560 }, { "epoch": 0.77, "learning_rate": 0.00018394304988000258, "loss": 0.0126, "step": 71570 }, { "epoch": 0.77, "learning_rate": 0.00018392683401439967, "loss": 0.0145, "step": 71580 }, { "epoch": 0.77, "learning_rate": 0.00018391061814879676, "loss": 0.0165, "step": 71590 }, { "epoch": 0.77, "learning_rate": 0.00018389440228319386, "loss": 0.0147, "step": 71600 }, { "epoch": 0.77, "learning_rate": 0.00018387818641759098, "loss": 0.0137, "step": 71610 }, { "epoch": 0.77, "learning_rate": 0.00018386197055198804, "loss": 0.014, "step": 71620 }, { "epoch": 0.77, "learning_rate": 0.00018384575468638513, "loss": 0.0119, "step": 71630 }, { "epoch": 0.77, "learning_rate": 0.00018382953882078225, "loss": 0.0148, "step": 71640 }, { "epoch": 0.77, "learning_rate": 0.00018381332295517935, "loss": 0.0137, "step": 71650 }, { "epoch": 0.77, "learning_rate": 0.0001837971070895764, "loss": 0.0147, "step": 71660 }, { "epoch": 0.77, "learning_rate": 0.0001837808912239735, "loss": 0.0112, "step": 71670 }, { "epoch": 0.77, "learning_rate": 0.00018376467535837062, "loss": 0.0149, "step": 71680 }, { "epoch": 0.78, "learning_rate": 0.00018374845949276772, "loss": 0.0154, "step": 71690 }, { "epoch": 0.78, "learning_rate": 0.00018373224362716478, "loss": 0.014, "step": 71700 }, { "epoch": 0.78, "learning_rate": 0.0001837160277615619, "loss": 0.0164, "step": 71710 }, { "epoch": 0.78, "learning_rate": 0.000183699811895959, "loss": 0.016, "step": 71720 }, { "epoch": 0.78, "learning_rate": 0.0001836835960303561, "loss": 0.0151, "step": 71730 }, { "epoch": 0.78, "learning_rate": 0.00018366738016475315, "loss": 0.0142, "step": 71740 }, { "epoch": 0.78, "learning_rate": 0.00018365116429915027, "loss": 0.0141, "step": 71750 }, { "epoch": 0.78, "learning_rate": 0.00018363494843354737, "loss": 0.0119, "step": 71760 }, { "epoch": 0.78, "learning_rate": 0.00018361873256794446, "loss": 0.0143, "step": 71770 }, { "epoch": 0.78, "learning_rate": 0.00018360251670234155, "loss": 0.0122, "step": 71780 }, { "epoch": 0.78, "learning_rate": 0.00018358630083673865, "loss": 0.0166, "step": 71790 }, { "epoch": 0.78, "learning_rate": 0.00018357008497113574, "loss": 0.0137, "step": 71800 }, { "epoch": 0.78, "learning_rate": 0.00018355386910553286, "loss": 0.0137, "step": 71810 }, { "epoch": 0.78, "learning_rate": 0.00018353765323992992, "loss": 0.0141, "step": 71820 }, { "epoch": 0.78, "learning_rate": 0.00018352143737432702, "loss": 0.0165, "step": 71830 }, { "epoch": 0.78, "learning_rate": 0.0001835052215087241, "loss": 0.0159, "step": 71840 }, { "epoch": 0.78, "learning_rate": 0.00018348900564312123, "loss": 0.0142, "step": 71850 }, { "epoch": 0.78, "learning_rate": 0.0001834727897775183, "loss": 0.015, "step": 71860 }, { "epoch": 0.78, "learning_rate": 0.0001834565739119154, "loss": 0.015, "step": 71870 }, { "epoch": 0.78, "learning_rate": 0.0001834403580463125, "loss": 0.0124, "step": 71880 }, { "epoch": 0.78, "learning_rate": 0.0001834241421807096, "loss": 0.0178, "step": 71890 }, { "epoch": 0.78, "learning_rate": 0.00018340792631510667, "loss": 0.0177, "step": 71900 }, { "epoch": 0.78, "learning_rate": 0.00018339171044950376, "loss": 0.0134, "step": 71910 }, { "epoch": 0.78, "learning_rate": 0.00018337549458390088, "loss": 0.0163, "step": 71920 }, { "epoch": 0.78, "learning_rate": 0.00018335927871829797, "loss": 0.0138, "step": 71930 }, { "epoch": 0.78, "learning_rate": 0.0001833430628526951, "loss": 0.0116, "step": 71940 }, { "epoch": 0.78, "learning_rate": 0.00018332684698709216, "loss": 0.014, "step": 71950 }, { "epoch": 0.78, "learning_rate": 0.00018331063112148925, "loss": 0.0142, "step": 71960 }, { "epoch": 0.78, "learning_rate": 0.00018329441525588634, "loss": 0.0154, "step": 71970 }, { "epoch": 0.78, "learning_rate": 0.00018327819939028346, "loss": 0.0139, "step": 71980 }, { "epoch": 0.78, "learning_rate": 0.00018326198352468053, "loss": 0.0194, "step": 71990 }, { "epoch": 0.78, "learning_rate": 0.00018324576765907762, "loss": 0.0217, "step": 72000 }, { "epoch": 0.78, "eval_cer": 0.9215503867888964, "eval_loss": 0.011484924703836441, "eval_runtime": 121.1843, "eval_samples_per_second": 16.504, "eval_steps_per_second": 4.126, "step": 72000 }, { "epoch": 0.78, "learning_rate": 0.00018322955179347474, "loss": 0.0165, "step": 72010 }, { "epoch": 0.78, "learning_rate": 0.00018321333592787183, "loss": 0.0157, "step": 72020 }, { "epoch": 0.78, "learning_rate": 0.0001831971200622689, "loss": 0.0161, "step": 72030 }, { "epoch": 0.78, "learning_rate": 0.000183180904196666, "loss": 0.0182, "step": 72040 }, { "epoch": 0.78, "learning_rate": 0.0001831646883310631, "loss": 0.0138, "step": 72050 }, { "epoch": 0.78, "learning_rate": 0.0001831484724654602, "loss": 0.0117, "step": 72060 }, { "epoch": 0.78, "learning_rate": 0.00018313225659985727, "loss": 0.0129, "step": 72070 }, { "epoch": 0.78, "learning_rate": 0.0001831160407342544, "loss": 0.018, "step": 72080 }, { "epoch": 0.78, "learning_rate": 0.00018309982486865148, "loss": 0.012, "step": 72090 }, { "epoch": 0.78, "learning_rate": 0.00018308360900304857, "loss": 0.0141, "step": 72100 }, { "epoch": 0.78, "learning_rate": 0.00018306739313744564, "loss": 0.0134, "step": 72110 }, { "epoch": 0.78, "learning_rate": 0.00018305117727184276, "loss": 0.0104, "step": 72120 }, { "epoch": 0.78, "learning_rate": 0.00018303496140623985, "loss": 0.0118, "step": 72130 }, { "epoch": 0.78, "learning_rate": 0.00018301874554063695, "loss": 0.0157, "step": 72140 }, { "epoch": 0.78, "learning_rate": 0.00018300252967503404, "loss": 0.0146, "step": 72150 }, { "epoch": 0.78, "learning_rate": 0.00018298631380943113, "loss": 0.0128, "step": 72160 }, { "epoch": 0.78, "learning_rate": 0.00018297009794382822, "loss": 0.014, "step": 72170 }, { "epoch": 0.78, "learning_rate": 0.00018295388207822534, "loss": 0.0126, "step": 72180 }, { "epoch": 0.78, "learning_rate": 0.0001829376662126224, "loss": 0.0152, "step": 72190 }, { "epoch": 0.78, "learning_rate": 0.0001829214503470195, "loss": 0.0129, "step": 72200 }, { "epoch": 0.78, "learning_rate": 0.0001829052344814166, "loss": 0.0163, "step": 72210 }, { "epoch": 0.78, "learning_rate": 0.00018288901861581371, "loss": 0.013, "step": 72220 }, { "epoch": 0.78, "learning_rate": 0.00018287280275021078, "loss": 0.0114, "step": 72230 }, { "epoch": 0.78, "learning_rate": 0.00018285658688460787, "loss": 0.0146, "step": 72240 }, { "epoch": 0.78, "learning_rate": 0.000182840371019005, "loss": 0.0128, "step": 72250 }, { "epoch": 0.78, "learning_rate": 0.00018282415515340209, "loss": 0.016, "step": 72260 }, { "epoch": 0.78, "learning_rate": 0.00018280793928779915, "loss": 0.016, "step": 72270 }, { "epoch": 0.78, "learning_rate": 0.00018279172342219624, "loss": 0.0175, "step": 72280 }, { "epoch": 0.78, "learning_rate": 0.00018277550755659336, "loss": 0.0146, "step": 72290 }, { "epoch": 0.78, "learning_rate": 0.00018275929169099046, "loss": 0.0137, "step": 72300 }, { "epoch": 0.78, "learning_rate": 0.00018274307582538752, "loss": 0.0104, "step": 72310 }, { "epoch": 0.78, "learning_rate": 0.00018272685995978464, "loss": 0.0152, "step": 72320 }, { "epoch": 0.78, "learning_rate": 0.00018271064409418173, "loss": 0.0158, "step": 72330 }, { "epoch": 0.78, "learning_rate": 0.00018269442822857883, "loss": 0.016, "step": 72340 }, { "epoch": 0.78, "learning_rate": 0.0001826782123629759, "loss": 0.0131, "step": 72350 }, { "epoch": 0.78, "learning_rate": 0.000182661996497373, "loss": 0.0259, "step": 72360 }, { "epoch": 0.78, "learning_rate": 0.0001826457806317701, "loss": 0.0172, "step": 72370 }, { "epoch": 0.78, "learning_rate": 0.00018262956476616723, "loss": 0.0156, "step": 72380 }, { "epoch": 0.78, "learning_rate": 0.0001826133489005643, "loss": 0.0194, "step": 72390 }, { "epoch": 0.78, "learning_rate": 0.00018259713303496138, "loss": 0.0151, "step": 72400 }, { "epoch": 0.78, "learning_rate": 0.00018258091716935848, "loss": 0.0188, "step": 72410 }, { "epoch": 0.78, "learning_rate": 0.0001825647013037556, "loss": 0.0157, "step": 72420 }, { "epoch": 0.78, "learning_rate": 0.00018254848543815266, "loss": 0.0165, "step": 72430 }, { "epoch": 0.78, "learning_rate": 0.00018253226957254975, "loss": 0.0153, "step": 72440 }, { "epoch": 0.78, "learning_rate": 0.00018251605370694687, "loss": 0.0157, "step": 72450 }, { "epoch": 0.78, "learning_rate": 0.00018249983784134397, "loss": 0.0193, "step": 72460 }, { "epoch": 0.78, "learning_rate": 0.00018248362197574103, "loss": 0.017, "step": 72470 }, { "epoch": 0.78, "learning_rate": 0.00018246740611013813, "loss": 0.0135, "step": 72480 }, { "epoch": 0.78, "learning_rate": 0.00018245119024453525, "loss": 0.0187, "step": 72490 }, { "epoch": 0.78, "learning_rate": 0.00018243497437893234, "loss": 0.0143, "step": 72500 }, { "epoch": 0.78, "learning_rate": 0.0001824187585133294, "loss": 0.0145, "step": 72510 }, { "epoch": 0.78, "learning_rate": 0.00018240254264772652, "loss": 0.0134, "step": 72520 }, { "epoch": 0.78, "learning_rate": 0.00018238632678212362, "loss": 0.0135, "step": 72530 }, { "epoch": 0.78, "learning_rate": 0.0001823701109165207, "loss": 0.0142, "step": 72540 }, { "epoch": 0.78, "learning_rate": 0.00018235389505091777, "loss": 0.016, "step": 72550 }, { "epoch": 0.78, "learning_rate": 0.0001823376791853149, "loss": 0.0154, "step": 72560 }, { "epoch": 0.78, "learning_rate": 0.000182321463319712, "loss": 0.0116, "step": 72570 }, { "epoch": 0.78, "learning_rate": 0.00018230524745410908, "loss": 0.0137, "step": 72580 }, { "epoch": 0.78, "learning_rate": 0.00018228903158850617, "loss": 0.0131, "step": 72590 }, { "epoch": 0.78, "learning_rate": 0.00018227281572290327, "loss": 0.015, "step": 72600 }, { "epoch": 0.78, "learning_rate": 0.00018225659985730036, "loss": 0.0128, "step": 72610 }, { "epoch": 0.79, "learning_rate": 0.00018224038399169748, "loss": 0.0185, "step": 72620 }, { "epoch": 0.79, "learning_rate": 0.00018222416812609454, "loss": 0.013, "step": 72630 }, { "epoch": 0.79, "learning_rate": 0.00018220795226049164, "loss": 0.0173, "step": 72640 }, { "epoch": 0.79, "learning_rate": 0.00018219173639488876, "loss": 0.0124, "step": 72650 }, { "epoch": 0.79, "learning_rate": 0.00018217552052928585, "loss": 0.0136, "step": 72660 }, { "epoch": 0.79, "learning_rate": 0.00018215930466368294, "loss": 0.0142, "step": 72670 }, { "epoch": 0.79, "learning_rate": 0.00018214308879808, "loss": 0.0168, "step": 72680 }, { "epoch": 0.79, "learning_rate": 0.00018212687293247713, "loss": 0.0155, "step": 72690 }, { "epoch": 0.79, "learning_rate": 0.00018211065706687422, "loss": 0.0141, "step": 72700 }, { "epoch": 0.79, "learning_rate": 0.0001820944412012713, "loss": 0.0136, "step": 72710 }, { "epoch": 0.79, "learning_rate": 0.0001820782253356684, "loss": 0.018, "step": 72720 }, { "epoch": 0.79, "learning_rate": 0.0001820620094700655, "loss": 0.0166, "step": 72730 }, { "epoch": 0.79, "learning_rate": 0.0001820457936044626, "loss": 0.0131, "step": 72740 }, { "epoch": 0.79, "learning_rate": 0.0001820295777388597, "loss": 0.0169, "step": 72750 }, { "epoch": 0.79, "learning_rate": 0.00018201336187325678, "loss": 0.0125, "step": 72760 }, { "epoch": 0.79, "learning_rate": 0.00018199714600765387, "loss": 0.0137, "step": 72770 }, { "epoch": 0.79, "learning_rate": 0.00018198093014205096, "loss": 0.024, "step": 72780 }, { "epoch": 0.79, "learning_rate": 0.00018196471427644808, "loss": 0.014, "step": 72790 }, { "epoch": 0.79, "learning_rate": 0.00018194849841084515, "loss": 0.0148, "step": 72800 }, { "epoch": 0.79, "learning_rate": 0.00018193228254524224, "loss": 0.0135, "step": 72810 }, { "epoch": 0.79, "learning_rate": 0.00018191606667963936, "loss": 0.0152, "step": 72820 }, { "epoch": 0.79, "learning_rate": 0.00018189985081403645, "loss": 0.0176, "step": 72830 }, { "epoch": 0.79, "learning_rate": 0.00018188363494843352, "loss": 0.0162, "step": 72840 }, { "epoch": 0.79, "learning_rate": 0.0001818674190828306, "loss": 0.0173, "step": 72850 }, { "epoch": 0.79, "learning_rate": 0.00018185120321722773, "loss": 0.0161, "step": 72860 }, { "epoch": 0.79, "learning_rate": 0.00018183498735162482, "loss": 0.014, "step": 72870 }, { "epoch": 0.79, "learning_rate": 0.0001818187714860219, "loss": 0.0132, "step": 72880 }, { "epoch": 0.79, "learning_rate": 0.000181802555620419, "loss": 0.0127, "step": 72890 }, { "epoch": 0.79, "learning_rate": 0.0001817863397548161, "loss": 0.0158, "step": 72900 }, { "epoch": 0.79, "learning_rate": 0.0001817701238892132, "loss": 0.0156, "step": 72910 }, { "epoch": 0.79, "learning_rate": 0.00018175390802361026, "loss": 0.0129, "step": 72920 }, { "epoch": 0.79, "learning_rate": 0.00018173769215800738, "loss": 0.0174, "step": 72930 }, { "epoch": 0.79, "learning_rate": 0.00018172147629240447, "loss": 0.0161, "step": 72940 }, { "epoch": 0.79, "learning_rate": 0.0001817052604268016, "loss": 0.0156, "step": 72950 }, { "epoch": 0.79, "learning_rate": 0.00018168904456119866, "loss": 0.0165, "step": 72960 }, { "epoch": 0.79, "learning_rate": 0.00018167282869559575, "loss": 0.0141, "step": 72970 }, { "epoch": 0.79, "learning_rate": 0.00018165661282999284, "loss": 0.0191, "step": 72980 }, { "epoch": 0.79, "learning_rate": 0.00018164039696438996, "loss": 0.0147, "step": 72990 }, { "epoch": 0.79, "learning_rate": 0.00018162418109878703, "loss": 0.012, "step": 73000 }, { "epoch": 0.79, "eval_cer": 0.9215382263475072, "eval_loss": 0.01048470288515091, "eval_runtime": 121.1149, "eval_samples_per_second": 16.513, "eval_steps_per_second": 4.128, "step": 73000 }, { "epoch": 0.79, "learning_rate": 0.00018160796523318412, "loss": 0.0164, "step": 73010 }, { "epoch": 0.79, "learning_rate": 0.00018159174936758124, "loss": 0.0129, "step": 73020 }, { "epoch": 0.79, "learning_rate": 0.00018157553350197834, "loss": 0.016, "step": 73030 }, { "epoch": 0.79, "learning_rate": 0.0001815593176363754, "loss": 0.0126, "step": 73040 }, { "epoch": 0.79, "learning_rate": 0.0001815431017707725, "loss": 0.014, "step": 73050 }, { "epoch": 0.79, "learning_rate": 0.0001815268859051696, "loss": 0.0162, "step": 73060 }, { "epoch": 0.79, "learning_rate": 0.0001815106700395667, "loss": 0.0144, "step": 73070 }, { "epoch": 0.79, "learning_rate": 0.00018149445417396377, "loss": 0.0123, "step": 73080 }, { "epoch": 0.79, "learning_rate": 0.0001814782383083609, "loss": 0.0132, "step": 73090 }, { "epoch": 0.79, "learning_rate": 0.00018146202244275798, "loss": 0.0133, "step": 73100 }, { "epoch": 0.79, "learning_rate": 0.00018144580657715508, "loss": 0.0148, "step": 73110 }, { "epoch": 0.79, "learning_rate": 0.00018142959071155214, "loss": 0.0137, "step": 73120 }, { "epoch": 0.79, "learning_rate": 0.00018141337484594926, "loss": 0.0135, "step": 73130 }, { "epoch": 0.79, "learning_rate": 0.00018139715898034636, "loss": 0.0159, "step": 73140 }, { "epoch": 0.79, "learning_rate": 0.00018138094311474345, "loss": 0.0135, "step": 73150 }, { "epoch": 0.79, "learning_rate": 0.00018136472724914054, "loss": 0.0154, "step": 73160 }, { "epoch": 0.79, "learning_rate": 0.00018134851138353763, "loss": 0.0132, "step": 73170 }, { "epoch": 0.79, "learning_rate": 0.00018133229551793473, "loss": 0.0129, "step": 73180 }, { "epoch": 0.79, "learning_rate": 0.00018131607965233185, "loss": 0.0133, "step": 73190 }, { "epoch": 0.79, "learning_rate": 0.0001812998637867289, "loss": 0.0138, "step": 73200 }, { "epoch": 0.79, "learning_rate": 0.000181283647921126, "loss": 0.0159, "step": 73210 }, { "epoch": 0.79, "learning_rate": 0.0001812674320555231, "loss": 0.0156, "step": 73220 }, { "epoch": 0.79, "learning_rate": 0.00018125121618992022, "loss": 0.0122, "step": 73230 }, { "epoch": 0.79, "learning_rate": 0.00018123500032431728, "loss": 0.018, "step": 73240 }, { "epoch": 0.79, "learning_rate": 0.00018121878445871438, "loss": 0.0208, "step": 73250 }, { "epoch": 0.79, "learning_rate": 0.0001812025685931115, "loss": 0.0182, "step": 73260 }, { "epoch": 0.79, "learning_rate": 0.0001811863527275086, "loss": 0.0142, "step": 73270 }, { "epoch": 0.79, "learning_rate": 0.00018117013686190565, "loss": 0.0143, "step": 73280 }, { "epoch": 0.79, "learning_rate": 0.00018115392099630275, "loss": 0.0186, "step": 73290 }, { "epoch": 0.79, "learning_rate": 0.00018113770513069987, "loss": 0.023, "step": 73300 }, { "epoch": 0.79, "learning_rate": 0.00018112148926509696, "loss": 0.0159, "step": 73310 }, { "epoch": 0.79, "learning_rate": 0.00018110527339949402, "loss": 0.0157, "step": 73320 }, { "epoch": 0.79, "learning_rate": 0.00018108905753389114, "loss": 0.0155, "step": 73330 }, { "epoch": 0.79, "learning_rate": 0.00018107284166828824, "loss": 0.0153, "step": 73340 }, { "epoch": 0.79, "learning_rate": 0.00018105662580268533, "loss": 0.0161, "step": 73350 }, { "epoch": 0.79, "learning_rate": 0.0001810404099370824, "loss": 0.0144, "step": 73360 }, { "epoch": 0.79, "learning_rate": 0.00018102419407147952, "loss": 0.0157, "step": 73370 }, { "epoch": 0.79, "learning_rate": 0.0001810079782058766, "loss": 0.0144, "step": 73380 }, { "epoch": 0.79, "learning_rate": 0.00018099176234027373, "loss": 0.0164, "step": 73390 }, { "epoch": 0.79, "learning_rate": 0.00018097554647467082, "loss": 0.0162, "step": 73400 }, { "epoch": 0.79, "learning_rate": 0.0001809593306090679, "loss": 0.0111, "step": 73410 }, { "epoch": 0.79, "learning_rate": 0.00018094311474346498, "loss": 0.0147, "step": 73420 }, { "epoch": 0.79, "learning_rate": 0.0001809268988778621, "loss": 0.0141, "step": 73430 }, { "epoch": 0.79, "learning_rate": 0.0001809106830122592, "loss": 0.0171, "step": 73440 }, { "epoch": 0.79, "learning_rate": 0.00018089446714665626, "loss": 0.013, "step": 73450 }, { "epoch": 0.79, "learning_rate": 0.00018087825128105338, "loss": 0.0158, "step": 73460 }, { "epoch": 0.79, "learning_rate": 0.00018086203541545047, "loss": 0.0125, "step": 73470 }, { "epoch": 0.79, "learning_rate": 0.00018084581954984756, "loss": 0.0136, "step": 73480 }, { "epoch": 0.79, "learning_rate": 0.00018082960368424463, "loss": 0.0148, "step": 73490 }, { "epoch": 0.79, "learning_rate": 0.00018081338781864175, "loss": 0.0134, "step": 73500 }, { "epoch": 0.79, "learning_rate": 0.00018079717195303884, "loss": 0.0147, "step": 73510 }, { "epoch": 0.79, "learning_rate": 0.00018078095608743593, "loss": 0.0143, "step": 73520 }, { "epoch": 0.79, "learning_rate": 0.00018076474022183303, "loss": 0.0147, "step": 73530 }, { "epoch": 0.8, "learning_rate": 0.00018074852435623012, "loss": 0.0164, "step": 73540 }, { "epoch": 0.8, "learning_rate": 0.0001807323084906272, "loss": 0.0164, "step": 73550 }, { "epoch": 0.8, "learning_rate": 0.00018071609262502433, "loss": 0.014, "step": 73560 }, { "epoch": 0.8, "learning_rate": 0.0001806998767594214, "loss": 0.0133, "step": 73570 }, { "epoch": 0.8, "learning_rate": 0.0001806836608938185, "loss": 0.0228, "step": 73580 }, { "epoch": 0.8, "learning_rate": 0.00018066744502821558, "loss": 0.0159, "step": 73590 }, { "epoch": 0.8, "learning_rate": 0.0001806512291626127, "loss": 0.0158, "step": 73600 }, { "epoch": 0.8, "learning_rate": 0.00018063501329700977, "loss": 0.017, "step": 73610 }, { "epoch": 0.8, "learning_rate": 0.00018061879743140686, "loss": 0.0132, "step": 73620 }, { "epoch": 0.8, "learning_rate": 0.00018060258156580398, "loss": 0.0129, "step": 73630 }, { "epoch": 0.8, "learning_rate": 0.00018058636570020107, "loss": 0.0122, "step": 73640 }, { "epoch": 0.8, "learning_rate": 0.00018057014983459814, "loss": 0.0179, "step": 73650 }, { "epoch": 0.8, "learning_rate": 0.00018055393396899526, "loss": 0.0205, "step": 73660 }, { "epoch": 0.8, "learning_rate": 0.00018053771810339235, "loss": 0.0151, "step": 73670 }, { "epoch": 0.8, "learning_rate": 0.00018052150223778944, "loss": 0.011, "step": 73680 }, { "epoch": 0.8, "learning_rate": 0.0001805052863721865, "loss": 0.0129, "step": 73690 }, { "epoch": 0.8, "learning_rate": 0.00018048907050658363, "loss": 0.0143, "step": 73700 }, { "epoch": 0.8, "learning_rate": 0.00018047285464098072, "loss": 0.013, "step": 73710 }, { "epoch": 0.8, "learning_rate": 0.00018045663877537782, "loss": 0.0107, "step": 73720 }, { "epoch": 0.8, "learning_rate": 0.0001804404229097749, "loss": 0.0156, "step": 73730 }, { "epoch": 0.8, "learning_rate": 0.000180424207044172, "loss": 0.0132, "step": 73740 }, { "epoch": 0.8, "learning_rate": 0.0001804079911785691, "loss": 0.0157, "step": 73750 }, { "epoch": 0.8, "learning_rate": 0.00018039177531296621, "loss": 0.0126, "step": 73760 }, { "epoch": 0.8, "learning_rate": 0.00018037555944736328, "loss": 0.0164, "step": 73770 }, { "epoch": 0.8, "learning_rate": 0.00018035934358176037, "loss": 0.0133, "step": 73780 }, { "epoch": 0.8, "learning_rate": 0.00018034312771615746, "loss": 0.0169, "step": 73790 }, { "epoch": 0.8, "learning_rate": 0.00018032691185055458, "loss": 0.0147, "step": 73800 }, { "epoch": 0.8, "learning_rate": 0.00018031069598495165, "loss": 0.0164, "step": 73810 }, { "epoch": 0.8, "learning_rate": 0.00018029448011934874, "loss": 0.0122, "step": 73820 }, { "epoch": 0.8, "learning_rate": 0.00018027826425374586, "loss": 0.0135, "step": 73830 }, { "epoch": 0.8, "learning_rate": 0.00018026204838814296, "loss": 0.017, "step": 73840 }, { "epoch": 0.8, "learning_rate": 0.00018024583252254002, "loss": 0.0137, "step": 73850 }, { "epoch": 0.8, "learning_rate": 0.00018022961665693711, "loss": 0.0141, "step": 73860 }, { "epoch": 0.8, "learning_rate": 0.00018021340079133423, "loss": 0.0156, "step": 73870 }, { "epoch": 0.8, "learning_rate": 0.00018019718492573133, "loss": 0.0123, "step": 73880 }, { "epoch": 0.8, "learning_rate": 0.0001801809690601284, "loss": 0.0148, "step": 73890 }, { "epoch": 0.8, "learning_rate": 0.0001801647531945255, "loss": 0.0125, "step": 73900 }, { "epoch": 0.8, "learning_rate": 0.0001801485373289226, "loss": 0.0146, "step": 73910 }, { "epoch": 0.8, "learning_rate": 0.0001801323214633197, "loss": 0.0161, "step": 73920 }, { "epoch": 0.8, "learning_rate": 0.00018011610559771676, "loss": 0.0117, "step": 73930 }, { "epoch": 0.8, "learning_rate": 0.00018009988973211388, "loss": 0.0155, "step": 73940 }, { "epoch": 0.8, "learning_rate": 0.00018008367386651098, "loss": 0.017, "step": 73950 }, { "epoch": 0.8, "learning_rate": 0.0001800674580009081, "loss": 0.0135, "step": 73960 }, { "epoch": 0.8, "learning_rate": 0.00018005124213530516, "loss": 0.0106, "step": 73970 }, { "epoch": 0.8, "learning_rate": 0.00018003502626970225, "loss": 0.0153, "step": 73980 }, { "epoch": 0.8, "learning_rate": 0.00018001881040409935, "loss": 0.0124, "step": 73990 }, { "epoch": 0.8, "learning_rate": 0.00018000259453849647, "loss": 0.0141, "step": 74000 }, { "epoch": 0.8, "eval_cer": 0.9215460437741146, "eval_loss": 0.010000753216445446, "eval_runtime": 121.1084, "eval_samples_per_second": 16.514, "eval_steps_per_second": 4.129, "step": 74000 }, { "epoch": 0.8, "learning_rate": 0.00017998637867289353, "loss": 0.011, "step": 74010 }, { "epoch": 0.8, "learning_rate": 0.00017997016280729063, "loss": 0.0165, "step": 74020 }, { "epoch": 0.8, "learning_rate": 0.00017995394694168774, "loss": 0.0151, "step": 74030 }, { "epoch": 0.8, "learning_rate": 0.00017993773107608484, "loss": 0.0138, "step": 74040 }, { "epoch": 0.8, "learning_rate": 0.0001799215152104819, "loss": 0.016, "step": 74050 }, { "epoch": 0.8, "learning_rate": 0.000179905299344879, "loss": 0.0189, "step": 74060 }, { "epoch": 0.8, "learning_rate": 0.00017988908347927612, "loss": 0.0123, "step": 74070 }, { "epoch": 0.8, "learning_rate": 0.0001798728676136732, "loss": 0.012, "step": 74080 }, { "epoch": 0.8, "learning_rate": 0.0001798566517480703, "loss": 0.0175, "step": 74090 }, { "epoch": 0.8, "learning_rate": 0.0001798404358824674, "loss": 0.0132, "step": 74100 }, { "epoch": 0.8, "learning_rate": 0.0001798242200168645, "loss": 0.0141, "step": 74110 }, { "epoch": 0.8, "learning_rate": 0.00017980800415126158, "loss": 0.0154, "step": 74120 }, { "epoch": 0.8, "learning_rate": 0.0001797917882856587, "loss": 0.0173, "step": 74130 }, { "epoch": 0.8, "learning_rate": 0.00017977557242005577, "loss": 0.0162, "step": 74140 }, { "epoch": 0.8, "learning_rate": 0.00017975935655445286, "loss": 0.0143, "step": 74150 }, { "epoch": 0.8, "learning_rate": 0.00017974314068884995, "loss": 0.0167, "step": 74160 }, { "epoch": 0.8, "learning_rate": 0.00017972692482324707, "loss": 0.0181, "step": 74170 }, { "epoch": 0.8, "learning_rate": 0.00017971070895764414, "loss": 0.0157, "step": 74180 }, { "epoch": 0.8, "learning_rate": 0.00017969449309204123, "loss": 0.0135, "step": 74190 }, { "epoch": 0.8, "learning_rate": 0.00017967827722643835, "loss": 0.0154, "step": 74200 }, { "epoch": 0.8, "learning_rate": 0.00017966206136083544, "loss": 0.014, "step": 74210 }, { "epoch": 0.8, "learning_rate": 0.0001796458454952325, "loss": 0.0159, "step": 74220 }, { "epoch": 0.8, "learning_rate": 0.0001796296296296296, "loss": 0.017, "step": 74230 }, { "epoch": 0.8, "learning_rate": 0.00017961341376402672, "loss": 0.0146, "step": 74240 }, { "epoch": 0.8, "learning_rate": 0.0001795971978984238, "loss": 0.013, "step": 74250 }, { "epoch": 0.8, "learning_rate": 0.00017958098203282088, "loss": 0.0147, "step": 74260 }, { "epoch": 0.8, "learning_rate": 0.000179564766167218, "loss": 0.0143, "step": 74270 }, { "epoch": 0.8, "learning_rate": 0.0001795485503016151, "loss": 0.0154, "step": 74280 }, { "epoch": 0.8, "learning_rate": 0.00017953233443601218, "loss": 0.0116, "step": 74290 }, { "epoch": 0.8, "learning_rate": 0.00017951611857040925, "loss": 0.0173, "step": 74300 }, { "epoch": 0.8, "learning_rate": 0.00017949990270480637, "loss": 0.0144, "step": 74310 }, { "epoch": 0.8, "learning_rate": 0.00017948368683920346, "loss": 0.0136, "step": 74320 }, { "epoch": 0.8, "learning_rate": 0.00017946747097360058, "loss": 0.0134, "step": 74330 }, { "epoch": 0.8, "learning_rate": 0.00017945125510799765, "loss": 0.0199, "step": 74340 }, { "epoch": 0.8, "learning_rate": 0.00017943503924239474, "loss": 0.0141, "step": 74350 }, { "epoch": 0.8, "learning_rate": 0.00017941882337679183, "loss": 0.0153, "step": 74360 }, { "epoch": 0.8, "learning_rate": 0.00017940260751118895, "loss": 0.014, "step": 74370 }, { "epoch": 0.8, "learning_rate": 0.00017938639164558602, "loss": 0.0145, "step": 74380 }, { "epoch": 0.8, "learning_rate": 0.0001793701757799831, "loss": 0.0147, "step": 74390 }, { "epoch": 0.8, "learning_rate": 0.00017935395991438023, "loss": 0.021, "step": 74400 }, { "epoch": 0.8, "learning_rate": 0.00017933774404877732, "loss": 0.0134, "step": 74410 }, { "epoch": 0.8, "learning_rate": 0.0001793215281831744, "loss": 0.0154, "step": 74420 }, { "epoch": 0.8, "learning_rate": 0.00017930531231757148, "loss": 0.0106, "step": 74430 }, { "epoch": 0.8, "learning_rate": 0.0001792890964519686, "loss": 0.0155, "step": 74440 }, { "epoch": 0.8, "learning_rate": 0.0001792728805863657, "loss": 0.0154, "step": 74450 }, { "epoch": 0.8, "learning_rate": 0.00017925666472076276, "loss": 0.0131, "step": 74460 }, { "epoch": 0.81, "learning_rate": 0.00017924044885515988, "loss": 0.0134, "step": 74470 }, { "epoch": 0.81, "learning_rate": 0.00017922423298955697, "loss": 0.0124, "step": 74480 }, { "epoch": 0.81, "learning_rate": 0.00017920801712395407, "loss": 0.0109, "step": 74490 }, { "epoch": 0.81, "learning_rate": 0.00017919180125835113, "loss": 0.0102, "step": 74500 }, { "epoch": 0.81, "learning_rate": 0.00017917558539274825, "loss": 0.0135, "step": 74510 }, { "epoch": 0.81, "learning_rate": 0.00017915936952714534, "loss": 0.0127, "step": 74520 }, { "epoch": 0.81, "learning_rate": 0.00017914315366154244, "loss": 0.013, "step": 74530 }, { "epoch": 0.81, "learning_rate": 0.00017912693779593953, "loss": 0.0127, "step": 74540 }, { "epoch": 0.81, "learning_rate": 0.00017911072193033662, "loss": 0.0142, "step": 74550 }, { "epoch": 0.81, "learning_rate": 0.00017909450606473371, "loss": 0.0168, "step": 74560 }, { "epoch": 0.81, "learning_rate": 0.00017907829019913083, "loss": 0.0161, "step": 74570 }, { "epoch": 0.81, "learning_rate": 0.0001790620743335279, "loss": 0.0118, "step": 74580 }, { "epoch": 0.81, "learning_rate": 0.000179045858467925, "loss": 0.0152, "step": 74590 }, { "epoch": 0.81, "learning_rate": 0.00017902964260232209, "loss": 0.0177, "step": 74600 }, { "epoch": 0.81, "learning_rate": 0.0001790134267367192, "loss": 0.0139, "step": 74610 }, { "epoch": 0.81, "learning_rate": 0.00017899721087111627, "loss": 0.0184, "step": 74620 }, { "epoch": 0.81, "learning_rate": 0.00017898099500551336, "loss": 0.0124, "step": 74630 }, { "epoch": 0.81, "learning_rate": 0.00017896477913991048, "loss": 0.0125, "step": 74640 }, { "epoch": 0.81, "learning_rate": 0.00017894856327430758, "loss": 0.0142, "step": 74650 }, { "epoch": 0.81, "learning_rate": 0.00017893234740870464, "loss": 0.0121, "step": 74660 }, { "epoch": 0.81, "learning_rate": 0.00017891613154310176, "loss": 0.0143, "step": 74670 }, { "epoch": 0.81, "learning_rate": 0.00017889991567749885, "loss": 0.0145, "step": 74680 }, { "epoch": 0.81, "learning_rate": 0.00017888369981189595, "loss": 0.0134, "step": 74690 }, { "epoch": 0.81, "learning_rate": 0.000178867483946293, "loss": 0.0129, "step": 74700 }, { "epoch": 0.81, "learning_rate": 0.00017885126808069013, "loss": 0.012, "step": 74710 }, { "epoch": 0.81, "learning_rate": 0.00017883505221508723, "loss": 0.0117, "step": 74720 }, { "epoch": 0.81, "learning_rate": 0.00017881883634948432, "loss": 0.0138, "step": 74730 }, { "epoch": 0.81, "learning_rate": 0.0001788026204838814, "loss": 0.0113, "step": 74740 }, { "epoch": 0.81, "learning_rate": 0.0001787864046182785, "loss": 0.016, "step": 74750 }, { "epoch": 0.81, "learning_rate": 0.0001787701887526756, "loss": 0.0116, "step": 74760 }, { "epoch": 0.81, "learning_rate": 0.00017875397288707272, "loss": 0.0122, "step": 74770 }, { "epoch": 0.81, "learning_rate": 0.00017873775702146978, "loss": 0.0142, "step": 74780 }, { "epoch": 0.81, "learning_rate": 0.00017872154115586687, "loss": 0.0135, "step": 74790 }, { "epoch": 0.81, "learning_rate": 0.00017870532529026397, "loss": 0.014, "step": 74800 }, { "epoch": 0.81, "learning_rate": 0.0001786891094246611, "loss": 0.0127, "step": 74810 }, { "epoch": 0.81, "learning_rate": 0.00017867289355905818, "loss": 0.0118, "step": 74820 }, { "epoch": 0.81, "learning_rate": 0.00017865667769345525, "loss": 0.0136, "step": 74830 }, { "epoch": 0.81, "learning_rate": 0.00017864046182785237, "loss": 0.0148, "step": 74840 }, { "epoch": 0.81, "learning_rate": 0.00017862424596224946, "loss": 0.0133, "step": 74850 }, { "epoch": 0.81, "learning_rate": 0.00017860803009664655, "loss": 0.0144, "step": 74860 }, { "epoch": 0.81, "learning_rate": 0.00017859181423104362, "loss": 0.0109, "step": 74870 }, { "epoch": 0.81, "learning_rate": 0.00017857559836544074, "loss": 0.0121, "step": 74880 }, { "epoch": 0.81, "learning_rate": 0.00017855938249983783, "loss": 0.012, "step": 74890 }, { "epoch": 0.81, "learning_rate": 0.00017854316663423492, "loss": 0.0141, "step": 74900 }, { "epoch": 0.81, "learning_rate": 0.00017852695076863201, "loss": 0.0132, "step": 74910 }, { "epoch": 0.81, "learning_rate": 0.0001785107349030291, "loss": 0.0172, "step": 74920 }, { "epoch": 0.81, "learning_rate": 0.0001784945190374262, "loss": 0.0129, "step": 74930 }, { "epoch": 0.81, "learning_rate": 0.00017847830317182332, "loss": 0.0128, "step": 74940 }, { "epoch": 0.81, "learning_rate": 0.00017846208730622039, "loss": 0.0146, "step": 74950 }, { "epoch": 0.81, "learning_rate": 0.00017844587144061748, "loss": 0.014, "step": 74960 }, { "epoch": 0.81, "learning_rate": 0.0001784296555750146, "loss": 0.0151, "step": 74970 }, { "epoch": 0.81, "learning_rate": 0.0001784134397094117, "loss": 0.0129, "step": 74980 }, { "epoch": 0.81, "learning_rate": 0.00017839722384380876, "loss": 0.014, "step": 74990 }, { "epoch": 0.81, "learning_rate": 0.00017838100797820585, "loss": 0.0136, "step": 75000 }, { "epoch": 0.81, "eval_cer": 0.9215417007593327, "eval_loss": 0.009637880139052868, "eval_runtime": 121.078, "eval_samples_per_second": 16.518, "eval_steps_per_second": 4.13, "step": 75000 }, { "epoch": 0.81, "learning_rate": 0.00017836479211260297, "loss": 0.0132, "step": 75010 }, { "epoch": 0.81, "learning_rate": 0.00017834857624700006, "loss": 0.0102, "step": 75020 }, { "epoch": 0.81, "learning_rate": 0.00017833236038139713, "loss": 0.0158, "step": 75030 }, { "epoch": 0.81, "learning_rate": 0.00017831614451579425, "loss": 0.0138, "step": 75040 }, { "epoch": 0.81, "learning_rate": 0.00017829992865019134, "loss": 0.0108, "step": 75050 }, { "epoch": 0.81, "learning_rate": 0.00017828371278458843, "loss": 0.0143, "step": 75060 }, { "epoch": 0.81, "learning_rate": 0.0001782674969189855, "loss": 0.0143, "step": 75070 }, { "epoch": 0.81, "learning_rate": 0.00017825128105338262, "loss": 0.0113, "step": 75080 }, { "epoch": 0.81, "learning_rate": 0.0001782350651877797, "loss": 0.0162, "step": 75090 }, { "epoch": 0.81, "learning_rate": 0.0001782188493221768, "loss": 0.0134, "step": 75100 }, { "epoch": 0.81, "learning_rate": 0.0001782026334565739, "loss": 0.0131, "step": 75110 }, { "epoch": 0.81, "learning_rate": 0.000178186417590971, "loss": 0.0137, "step": 75120 }, { "epoch": 0.81, "learning_rate": 0.00017817020172536808, "loss": 0.0118, "step": 75130 }, { "epoch": 0.81, "learning_rate": 0.0001781539858597652, "loss": 0.0129, "step": 75140 }, { "epoch": 0.81, "learning_rate": 0.00017813776999416227, "loss": 0.0145, "step": 75150 }, { "epoch": 0.81, "learning_rate": 0.00017812155412855936, "loss": 0.013, "step": 75160 }, { "epoch": 0.81, "learning_rate": 0.00017810533826295645, "loss": 0.0151, "step": 75170 }, { "epoch": 0.81, "learning_rate": 0.00017808912239735357, "loss": 0.0147, "step": 75180 }, { "epoch": 0.81, "learning_rate": 0.00017807290653175064, "loss": 0.0121, "step": 75190 }, { "epoch": 0.81, "learning_rate": 0.00017805669066614773, "loss": 0.0118, "step": 75200 }, { "epoch": 0.81, "learning_rate": 0.00017804047480054485, "loss": 0.0151, "step": 75210 }, { "epoch": 0.81, "learning_rate": 0.00017802425893494194, "loss": 0.0133, "step": 75220 }, { "epoch": 0.81, "learning_rate": 0.000178008043069339, "loss": 0.0151, "step": 75230 }, { "epoch": 0.81, "learning_rate": 0.0001779918272037361, "loss": 0.0136, "step": 75240 }, { "epoch": 0.81, "learning_rate": 0.00017797561133813322, "loss": 0.0121, "step": 75250 }, { "epoch": 0.81, "learning_rate": 0.00017795939547253032, "loss": 0.0132, "step": 75260 }, { "epoch": 0.81, "learning_rate": 0.00017794317960692738, "loss": 0.0176, "step": 75270 }, { "epoch": 0.81, "learning_rate": 0.0001779269637413245, "loss": 0.011, "step": 75280 }, { "epoch": 0.81, "learning_rate": 0.0001779107478757216, "loss": 0.0159, "step": 75290 }, { "epoch": 0.81, "learning_rate": 0.00017789453201011869, "loss": 0.0132, "step": 75300 }, { "epoch": 0.81, "learning_rate": 0.00017787831614451575, "loss": 0.013, "step": 75310 }, { "epoch": 0.81, "learning_rate": 0.00017786210027891287, "loss": 0.0126, "step": 75320 }, { "epoch": 0.81, "learning_rate": 0.00017784588441330996, "loss": 0.0134, "step": 75330 }, { "epoch": 0.81, "learning_rate": 0.00017782966854770708, "loss": 0.0145, "step": 75340 }, { "epoch": 0.81, "learning_rate": 0.00017781345268210415, "loss": 0.0151, "step": 75350 }, { "epoch": 0.81, "learning_rate": 0.00017779723681650124, "loss": 0.0139, "step": 75360 }, { "epoch": 0.81, "learning_rate": 0.00017778102095089834, "loss": 0.0174, "step": 75370 }, { "epoch": 0.81, "learning_rate": 0.00017776480508529546, "loss": 0.0153, "step": 75380 }, { "epoch": 0.82, "learning_rate": 0.00017774858921969252, "loss": 0.0114, "step": 75390 }, { "epoch": 0.82, "learning_rate": 0.0001777323733540896, "loss": 0.015, "step": 75400 }, { "epoch": 0.82, "learning_rate": 0.00017771615748848673, "loss": 0.0139, "step": 75410 }, { "epoch": 0.82, "learning_rate": 0.00017769994162288383, "loss": 0.0136, "step": 75420 }, { "epoch": 0.82, "learning_rate": 0.0001776837257572809, "loss": 0.013, "step": 75430 }, { "epoch": 0.82, "learning_rate": 0.00017766750989167798, "loss": 0.0161, "step": 75440 }, { "epoch": 0.82, "learning_rate": 0.0001776512940260751, "loss": 0.0125, "step": 75450 }, { "epoch": 0.82, "learning_rate": 0.0001776350781604722, "loss": 0.0155, "step": 75460 }, { "epoch": 0.82, "learning_rate": 0.00017761886229486926, "loss": 0.0119, "step": 75470 }, { "epoch": 0.82, "learning_rate": 0.00017760264642926638, "loss": 0.0159, "step": 75480 }, { "epoch": 0.82, "learning_rate": 0.00017758643056366348, "loss": 0.0124, "step": 75490 }, { "epoch": 0.82, "learning_rate": 0.00017757021469806057, "loss": 0.0145, "step": 75500 }, { "epoch": 0.82, "learning_rate": 0.00017755399883245763, "loss": 0.0131, "step": 75510 }, { "epoch": 0.82, "learning_rate": 0.00017753778296685475, "loss": 0.0108, "step": 75520 }, { "epoch": 0.82, "learning_rate": 0.00017752156710125185, "loss": 0.0132, "step": 75530 }, { "epoch": 0.82, "learning_rate": 0.00017750535123564894, "loss": 0.015, "step": 75540 }, { "epoch": 0.82, "learning_rate": 0.00017748913537004606, "loss": 0.0155, "step": 75550 }, { "epoch": 0.82, "learning_rate": 0.00017747291950444312, "loss": 0.0145, "step": 75560 }, { "epoch": 0.82, "learning_rate": 0.00017745670363884022, "loss": 0.014, "step": 75570 }, { "epoch": 0.82, "learning_rate": 0.00017744048777323734, "loss": 0.0142, "step": 75580 }, { "epoch": 0.82, "learning_rate": 0.00017742427190763443, "loss": 0.0143, "step": 75590 }, { "epoch": 0.82, "learning_rate": 0.0001774080560420315, "loss": 0.0136, "step": 75600 }, { "epoch": 0.82, "learning_rate": 0.0001773918401764286, "loss": 0.0169, "step": 75610 }, { "epoch": 0.82, "learning_rate": 0.0001773756243108257, "loss": 0.0149, "step": 75620 }, { "epoch": 0.82, "learning_rate": 0.0001773594084452228, "loss": 0.0161, "step": 75630 }, { "epoch": 0.82, "learning_rate": 0.00017734319257961987, "loss": 0.0129, "step": 75640 }, { "epoch": 0.82, "learning_rate": 0.00017732697671401699, "loss": 0.0161, "step": 75650 }, { "epoch": 0.82, "learning_rate": 0.00017731076084841408, "loss": 0.013, "step": 75660 }, { "epoch": 0.82, "learning_rate": 0.00017729454498281117, "loss": 0.0147, "step": 75670 }, { "epoch": 0.82, "learning_rate": 0.00017727832911720826, "loss": 0.0133, "step": 75680 }, { "epoch": 0.82, "learning_rate": 0.00017726211325160536, "loss": 0.0132, "step": 75690 }, { "epoch": 0.82, "learning_rate": 0.00017724589738600245, "loss": 0.0147, "step": 75700 }, { "epoch": 0.82, "learning_rate": 0.00017722968152039957, "loss": 0.0164, "step": 75710 }, { "epoch": 0.82, "learning_rate": 0.00017721346565479664, "loss": 0.0121, "step": 75720 }, { "epoch": 0.82, "learning_rate": 0.00017719724978919373, "loss": 0.0151, "step": 75730 }, { "epoch": 0.82, "learning_rate": 0.00017718103392359082, "loss": 0.0128, "step": 75740 }, { "epoch": 0.82, "learning_rate": 0.00017716481805798794, "loss": 0.0185, "step": 75750 }, { "epoch": 0.82, "learning_rate": 0.000177148602192385, "loss": 0.0138, "step": 75760 }, { "epoch": 0.82, "learning_rate": 0.0001771323863267821, "loss": 0.016, "step": 75770 }, { "epoch": 0.82, "learning_rate": 0.00017711617046117922, "loss": 0.0157, "step": 75780 }, { "epoch": 0.82, "learning_rate": 0.0001770999545955763, "loss": 0.0155, "step": 75790 }, { "epoch": 0.82, "learning_rate": 0.00017708373872997338, "loss": 0.0152, "step": 75800 }, { "epoch": 0.82, "learning_rate": 0.00017706752286437047, "loss": 0.0119, "step": 75810 }, { "epoch": 0.82, "learning_rate": 0.0001770513069987676, "loss": 0.0144, "step": 75820 }, { "epoch": 0.82, "learning_rate": 0.00017703509113316468, "loss": 0.0122, "step": 75830 }, { "epoch": 0.82, "learning_rate": 0.00017701887526756175, "loss": 0.0135, "step": 75840 }, { "epoch": 0.82, "learning_rate": 0.00017700265940195887, "loss": 0.0162, "step": 75850 }, { "epoch": 0.82, "learning_rate": 0.00017698644353635596, "loss": 0.0155, "step": 75860 }, { "epoch": 0.82, "learning_rate": 0.00017697022767075305, "loss": 0.0162, "step": 75870 }, { "epoch": 0.82, "learning_rate": 0.00017695401180515012, "loss": 0.0134, "step": 75880 }, { "epoch": 0.82, "learning_rate": 0.00017693779593954724, "loss": 0.0137, "step": 75890 }, { "epoch": 0.82, "learning_rate": 0.00017692158007394433, "loss": 0.0124, "step": 75900 }, { "epoch": 0.82, "learning_rate": 0.00017690536420834142, "loss": 0.0131, "step": 75910 }, { "epoch": 0.82, "learning_rate": 0.00017688914834273852, "loss": 0.0111, "step": 75920 }, { "epoch": 0.82, "learning_rate": 0.0001768729324771356, "loss": 0.0108, "step": 75930 }, { "epoch": 0.82, "learning_rate": 0.0001768567166115327, "loss": 0.0144, "step": 75940 }, { "epoch": 0.82, "learning_rate": 0.00017684050074592982, "loss": 0.0115, "step": 75950 }, { "epoch": 0.82, "learning_rate": 0.0001768242848803269, "loss": 0.0123, "step": 75960 }, { "epoch": 0.82, "learning_rate": 0.00017680806901472398, "loss": 0.0141, "step": 75970 }, { "epoch": 0.82, "learning_rate": 0.0001767918531491211, "loss": 0.0122, "step": 75980 }, { "epoch": 0.82, "learning_rate": 0.0001767756372835182, "loss": 0.0178, "step": 75990 }, { "epoch": 0.82, "learning_rate": 0.00017675942141791526, "loss": 0.0106, "step": 76000 }, { "epoch": 0.82, "eval_cer": 0.9215929483337589, "eval_loss": 0.010436671786010265, "eval_runtime": 121.1923, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 76000 }, { "epoch": 0.82, "learning_rate": 0.00017674320555231235, "loss": 0.0147, "step": 76010 }, { "epoch": 0.82, "learning_rate": 0.00017672698968670947, "loss": 0.0184, "step": 76020 }, { "epoch": 0.82, "learning_rate": 0.00017671077382110656, "loss": 0.0247, "step": 76030 }, { "epoch": 0.82, "learning_rate": 0.00017669455795550363, "loss": 0.0145, "step": 76040 }, { "epoch": 0.82, "learning_rate": 0.00017667834208990075, "loss": 0.0135, "step": 76050 }, { "epoch": 0.82, "learning_rate": 0.00017666212622429784, "loss": 0.0151, "step": 76060 }, { "epoch": 0.82, "learning_rate": 0.00017664591035869494, "loss": 0.013, "step": 76070 }, { "epoch": 0.82, "learning_rate": 0.000176629694493092, "loss": 0.016, "step": 76080 }, { "epoch": 0.82, "learning_rate": 0.00017661347862748912, "loss": 0.0136, "step": 76090 }, { "epoch": 0.82, "learning_rate": 0.00017659726276188621, "loss": 0.0135, "step": 76100 }, { "epoch": 0.82, "learning_rate": 0.0001765810468962833, "loss": 0.0165, "step": 76110 }, { "epoch": 0.82, "learning_rate": 0.0001765648310306804, "loss": 0.016, "step": 76120 }, { "epoch": 0.82, "learning_rate": 0.0001765486151650775, "loss": 0.0134, "step": 76130 }, { "epoch": 0.82, "learning_rate": 0.00017653239929947458, "loss": 0.0138, "step": 76140 }, { "epoch": 0.82, "learning_rate": 0.0001765161834338717, "loss": 0.0153, "step": 76150 }, { "epoch": 0.82, "learning_rate": 0.00017649996756826877, "loss": 0.016, "step": 76160 }, { "epoch": 0.82, "learning_rate": 0.00017648375170266586, "loss": 0.0143, "step": 76170 }, { "epoch": 0.82, "learning_rate": 0.00017646753583706296, "loss": 0.0148, "step": 76180 }, { "epoch": 0.82, "learning_rate": 0.00017645131997146008, "loss": 0.017, "step": 76190 }, { "epoch": 0.82, "learning_rate": 0.00017643510410585714, "loss": 0.0166, "step": 76200 }, { "epoch": 0.82, "learning_rate": 0.00017641888824025423, "loss": 0.0155, "step": 76210 }, { "epoch": 0.82, "learning_rate": 0.00017640267237465135, "loss": 0.0167, "step": 76220 }, { "epoch": 0.82, "learning_rate": 0.00017638645650904845, "loss": 0.0202, "step": 76230 }, { "epoch": 0.82, "learning_rate": 0.0001763702406434455, "loss": 0.0136, "step": 76240 }, { "epoch": 0.82, "learning_rate": 0.0001763540247778426, "loss": 0.0181, "step": 76250 }, { "epoch": 0.82, "learning_rate": 0.00017633780891223972, "loss": 0.0112, "step": 76260 }, { "epoch": 0.82, "learning_rate": 0.00017632159304663682, "loss": 0.0164, "step": 76270 }, { "epoch": 0.82, "learning_rate": 0.00017630537718103394, "loss": 0.0131, "step": 76280 }, { "epoch": 0.82, "learning_rate": 0.000176289161315431, "loss": 0.0133, "step": 76290 }, { "epoch": 0.82, "learning_rate": 0.0001762729454498281, "loss": 0.0149, "step": 76300 }, { "epoch": 0.82, "learning_rate": 0.0001762567295842252, "loss": 0.0133, "step": 76310 }, { "epoch": 0.83, "learning_rate": 0.0001762405137186223, "loss": 0.015, "step": 76320 }, { "epoch": 0.83, "learning_rate": 0.00017622429785301937, "loss": 0.0149, "step": 76330 }, { "epoch": 0.83, "learning_rate": 0.00017620808198741647, "loss": 0.0138, "step": 76340 }, { "epoch": 0.83, "learning_rate": 0.0001761918661218136, "loss": 0.0187, "step": 76350 }, { "epoch": 0.83, "learning_rate": 0.00017617565025621068, "loss": 0.0154, "step": 76360 }, { "epoch": 0.83, "learning_rate": 0.00017615943439060775, "loss": 0.0169, "step": 76370 }, { "epoch": 0.83, "learning_rate": 0.00017614321852500484, "loss": 0.0139, "step": 76380 }, { "epoch": 0.83, "learning_rate": 0.00017612700265940196, "loss": 0.0165, "step": 76390 }, { "epoch": 0.83, "learning_rate": 0.00017611078679379905, "loss": 0.014, "step": 76400 }, { "epoch": 0.83, "learning_rate": 0.00017609457092819612, "loss": 0.0139, "step": 76410 }, { "epoch": 0.83, "learning_rate": 0.00017607835506259324, "loss": 0.0125, "step": 76420 }, { "epoch": 0.83, "learning_rate": 0.00017606213919699033, "loss": 0.0145, "step": 76430 }, { "epoch": 0.83, "learning_rate": 0.00017604592333138742, "loss": 0.0139, "step": 76440 }, { "epoch": 0.83, "learning_rate": 0.0001760297074657845, "loss": 0.0135, "step": 76450 }, { "epoch": 0.83, "learning_rate": 0.0001760134916001816, "loss": 0.0128, "step": 76460 }, { "epoch": 0.83, "learning_rate": 0.0001759972757345787, "loss": 0.013, "step": 76470 }, { "epoch": 0.83, "learning_rate": 0.0001759810598689758, "loss": 0.0151, "step": 76480 }, { "epoch": 0.83, "learning_rate": 0.00017596484400337289, "loss": 0.0106, "step": 76490 }, { "epoch": 0.83, "learning_rate": 0.00017594862813776998, "loss": 0.0135, "step": 76500 }, { "epoch": 0.83, "learning_rate": 0.00017593241227216707, "loss": 0.0172, "step": 76510 }, { "epoch": 0.83, "learning_rate": 0.0001759161964065642, "loss": 0.014, "step": 76520 }, { "epoch": 0.83, "learning_rate": 0.00017589998054096126, "loss": 0.0116, "step": 76530 }, { "epoch": 0.83, "learning_rate": 0.00017588376467535835, "loss": 0.0169, "step": 76540 }, { "epoch": 0.83, "learning_rate": 0.00017586754880975544, "loss": 0.0142, "step": 76550 }, { "epoch": 0.83, "learning_rate": 0.00017585133294415256, "loss": 0.014, "step": 76560 }, { "epoch": 0.83, "learning_rate": 0.00017583511707854963, "loss": 0.0139, "step": 76570 }, { "epoch": 0.83, "learning_rate": 0.00017581890121294672, "loss": 0.0128, "step": 76580 }, { "epoch": 0.83, "learning_rate": 0.00017580268534734384, "loss": 0.0113, "step": 76590 }, { "epoch": 0.83, "learning_rate": 0.00017578646948174093, "loss": 0.0116, "step": 76600 }, { "epoch": 0.83, "learning_rate": 0.000175770253616138, "loss": 0.0126, "step": 76610 }, { "epoch": 0.83, "learning_rate": 0.0001757540377505351, "loss": 0.0133, "step": 76620 }, { "epoch": 0.83, "learning_rate": 0.0001757378218849322, "loss": 0.0122, "step": 76630 }, { "epoch": 0.83, "learning_rate": 0.0001757216060193293, "loss": 0.0129, "step": 76640 }, { "epoch": 0.83, "learning_rate": 0.00017570539015372637, "loss": 0.0119, "step": 76650 }, { "epoch": 0.83, "learning_rate": 0.0001756891742881235, "loss": 0.0127, "step": 76660 }, { "epoch": 0.83, "learning_rate": 0.00017567295842252058, "loss": 0.0141, "step": 76670 }, { "epoch": 0.83, "learning_rate": 0.00017565674255691767, "loss": 0.0122, "step": 76680 }, { "epoch": 0.83, "learning_rate": 0.00017564052669131474, "loss": 0.0148, "step": 76690 }, { "epoch": 0.83, "learning_rate": 0.00017562431082571186, "loss": 0.013, "step": 76700 }, { "epoch": 0.83, "learning_rate": 0.00017560809496010895, "loss": 0.0151, "step": 76710 }, { "epoch": 0.83, "learning_rate": 0.00017559187909450607, "loss": 0.0105, "step": 76720 }, { "epoch": 0.83, "learning_rate": 0.00017557566322890314, "loss": 0.0156, "step": 76730 }, { "epoch": 0.83, "learning_rate": 0.00017555944736330023, "loss": 0.0158, "step": 76740 }, { "epoch": 0.83, "learning_rate": 0.00017554323149769732, "loss": 0.0158, "step": 76750 }, { "epoch": 0.83, "learning_rate": 0.00017552701563209444, "loss": 0.0175, "step": 76760 }, { "epoch": 0.83, "learning_rate": 0.0001755107997664915, "loss": 0.0163, "step": 76770 }, { "epoch": 0.83, "learning_rate": 0.0001754945839008886, "loss": 0.0167, "step": 76780 }, { "epoch": 0.83, "learning_rate": 0.00017547836803528572, "loss": 0.0137, "step": 76790 }, { "epoch": 0.83, "learning_rate": 0.00017546215216968281, "loss": 0.0138, "step": 76800 }, { "epoch": 0.83, "learning_rate": 0.00017544593630407988, "loss": 0.0118, "step": 76810 }, { "epoch": 0.83, "learning_rate": 0.00017542972043847697, "loss": 0.0181, "step": 76820 }, { "epoch": 0.83, "learning_rate": 0.0001754135045728741, "loss": 0.0137, "step": 76830 }, { "epoch": 0.83, "learning_rate": 0.00017539728870727119, "loss": 0.0117, "step": 76840 }, { "epoch": 0.83, "learning_rate": 0.00017538107284166825, "loss": 0.0143, "step": 76850 }, { "epoch": 0.83, "learning_rate": 0.00017536485697606537, "loss": 0.0152, "step": 76860 }, { "epoch": 0.83, "learning_rate": 0.00017534864111046246, "loss": 0.014, "step": 76870 }, { "epoch": 0.83, "learning_rate": 0.00017533242524485956, "loss": 0.0156, "step": 76880 }, { "epoch": 0.83, "learning_rate": 0.00017531620937925662, "loss": 0.0157, "step": 76890 }, { "epoch": 0.83, "learning_rate": 0.00017529999351365374, "loss": 0.0175, "step": 76900 }, { "epoch": 0.83, "learning_rate": 0.00017528377764805083, "loss": 0.0119, "step": 76910 }, { "epoch": 0.83, "learning_rate": 0.00017526756178244793, "loss": 0.0145, "step": 76920 }, { "epoch": 0.83, "learning_rate": 0.00017525134591684502, "loss": 0.0162, "step": 76930 }, { "epoch": 0.83, "learning_rate": 0.0001752351300512421, "loss": 0.0158, "step": 76940 }, { "epoch": 0.83, "learning_rate": 0.0001752189141856392, "loss": 0.0135, "step": 76950 }, { "epoch": 0.83, "learning_rate": 0.00017520269832003633, "loss": 0.0145, "step": 76960 }, { "epoch": 0.83, "learning_rate": 0.00017518648245443342, "loss": 0.0117, "step": 76970 }, { "epoch": 0.83, "learning_rate": 0.00017517026658883048, "loss": 0.0156, "step": 76980 }, { "epoch": 0.83, "learning_rate": 0.0001751540507232276, "loss": 0.0163, "step": 76990 }, { "epoch": 0.83, "learning_rate": 0.0001751378348576247, "loss": 0.0176, "step": 77000 }, { "epoch": 0.83, "eval_cer": 0.9215825250982824, "eval_loss": 0.010247960686683655, "eval_runtime": 121.2734, "eval_samples_per_second": 16.492, "eval_steps_per_second": 4.123, "step": 77000 }, { "epoch": 0.83, "learning_rate": 0.0001751216189920218, "loss": 0.0163, "step": 77010 }, { "epoch": 0.83, "learning_rate": 0.00017510540312641885, "loss": 0.0138, "step": 77020 }, { "epoch": 0.83, "learning_rate": 0.00017508918726081597, "loss": 0.0126, "step": 77030 }, { "epoch": 0.83, "learning_rate": 0.00017507297139521307, "loss": 0.013, "step": 77040 }, { "epoch": 0.83, "learning_rate": 0.00017505675552961016, "loss": 0.0125, "step": 77050 }, { "epoch": 0.83, "learning_rate": 0.00017504053966400725, "loss": 0.0128, "step": 77060 }, { "epoch": 0.83, "learning_rate": 0.00017502432379840435, "loss": 0.0136, "step": 77070 }, { "epoch": 0.83, "learning_rate": 0.00017500810793280144, "loss": 0.0147, "step": 77080 }, { "epoch": 0.83, "learning_rate": 0.00017499189206719856, "loss": 0.0115, "step": 77090 }, { "epoch": 0.83, "learning_rate": 0.00017497567620159562, "loss": 0.0133, "step": 77100 }, { "epoch": 0.83, "learning_rate": 0.00017495946033599272, "loss": 0.0174, "step": 77110 }, { "epoch": 0.83, "learning_rate": 0.0001749432444703898, "loss": 0.0129, "step": 77120 }, { "epoch": 0.83, "learning_rate": 0.00017492702860478693, "loss": 0.0144, "step": 77130 }, { "epoch": 0.83, "learning_rate": 0.000174910812739184, "loss": 0.0107, "step": 77140 }, { "epoch": 0.83, "learning_rate": 0.0001748945968735811, "loss": 0.0128, "step": 77150 }, { "epoch": 0.83, "learning_rate": 0.0001748783810079782, "loss": 0.0147, "step": 77160 }, { "epoch": 0.83, "learning_rate": 0.0001748621651423753, "loss": 0.0121, "step": 77170 }, { "epoch": 0.83, "learning_rate": 0.00017484594927677237, "loss": 0.0129, "step": 77180 }, { "epoch": 0.83, "learning_rate": 0.00017482973341116946, "loss": 0.0143, "step": 77190 }, { "epoch": 0.83, "learning_rate": 0.00017481351754556658, "loss": 0.0123, "step": 77200 }, { "epoch": 0.83, "learning_rate": 0.00017479730167996367, "loss": 0.0143, "step": 77210 }, { "epoch": 0.83, "learning_rate": 0.00017478108581436074, "loss": 0.0141, "step": 77220 }, { "epoch": 0.83, "learning_rate": 0.00017476486994875786, "loss": 0.0149, "step": 77230 }, { "epoch": 0.84, "learning_rate": 0.00017474865408315495, "loss": 0.0141, "step": 77240 }, { "epoch": 0.84, "learning_rate": 0.00017473243821755204, "loss": 0.0166, "step": 77250 }, { "epoch": 0.84, "learning_rate": 0.0001747162223519491, "loss": 0.015, "step": 77260 }, { "epoch": 0.84, "learning_rate": 0.00017470000648634623, "loss": 0.015, "step": 77270 }, { "epoch": 0.84, "learning_rate": 0.00017468379062074332, "loss": 0.014, "step": 77280 }, { "epoch": 0.84, "learning_rate": 0.00017466757475514044, "loss": 0.014, "step": 77290 }, { "epoch": 0.84, "learning_rate": 0.0001746513588895375, "loss": 0.0139, "step": 77300 }, { "epoch": 0.84, "learning_rate": 0.0001746351430239346, "loss": 0.0168, "step": 77310 }, { "epoch": 0.84, "learning_rate": 0.0001746189271583317, "loss": 0.0144, "step": 77320 }, { "epoch": 0.84, "learning_rate": 0.0001746027112927288, "loss": 0.0118, "step": 77330 }, { "epoch": 0.84, "learning_rate": 0.00017458649542712588, "loss": 0.0151, "step": 77340 }, { "epoch": 0.84, "learning_rate": 0.00017457027956152297, "loss": 0.0148, "step": 77350 }, { "epoch": 0.84, "learning_rate": 0.0001745540636959201, "loss": 0.0147, "step": 77360 }, { "epoch": 0.84, "learning_rate": 0.00017453784783031718, "loss": 0.0174, "step": 77370 }, { "epoch": 0.84, "learning_rate": 0.00017452163196471425, "loss": 0.0139, "step": 77380 }, { "epoch": 0.84, "learning_rate": 0.00017450541609911134, "loss": 0.0139, "step": 77390 }, { "epoch": 0.84, "learning_rate": 0.00017448920023350846, "loss": 0.0165, "step": 77400 }, { "epoch": 0.84, "learning_rate": 0.00017447298436790555, "loss": 0.0157, "step": 77410 }, { "epoch": 0.84, "learning_rate": 0.00017445676850230262, "loss": 0.0169, "step": 77420 }, { "epoch": 0.84, "learning_rate": 0.00017444055263669974, "loss": 0.0122, "step": 77430 }, { "epoch": 0.84, "learning_rate": 0.00017442433677109683, "loss": 0.0154, "step": 77440 }, { "epoch": 0.84, "learning_rate": 0.00017440812090549392, "loss": 0.0131, "step": 77450 }, { "epoch": 0.84, "learning_rate": 0.000174391905039891, "loss": 0.0138, "step": 77460 }, { "epoch": 0.84, "learning_rate": 0.0001743756891742881, "loss": 0.0147, "step": 77470 }, { "epoch": 0.84, "learning_rate": 0.0001743594733086852, "loss": 0.0138, "step": 77480 }, { "epoch": 0.84, "learning_rate": 0.0001743432574430823, "loss": 0.0176, "step": 77490 }, { "epoch": 0.84, "learning_rate": 0.0001743270415774794, "loss": 0.0119, "step": 77500 }, { "epoch": 0.84, "learning_rate": 0.00017431082571187648, "loss": 0.0148, "step": 77510 }, { "epoch": 0.84, "learning_rate": 0.00017429460984627357, "loss": 0.0106, "step": 77520 }, { "epoch": 0.84, "learning_rate": 0.0001742783939806707, "loss": 0.0124, "step": 77530 }, { "epoch": 0.84, "learning_rate": 0.00017426217811506776, "loss": 0.017, "step": 77540 }, { "epoch": 0.84, "learning_rate": 0.00017424596224946485, "loss": 0.0129, "step": 77550 }, { "epoch": 0.84, "learning_rate": 0.00017422974638386194, "loss": 0.0123, "step": 77560 }, { "epoch": 0.84, "learning_rate": 0.00017421353051825906, "loss": 0.014, "step": 77570 }, { "epoch": 0.84, "learning_rate": 0.00017419731465265613, "loss": 0.0124, "step": 77580 }, { "epoch": 0.84, "learning_rate": 0.00017418109878705322, "loss": 0.0158, "step": 77590 }, { "epoch": 0.84, "learning_rate": 0.00017416488292145034, "loss": 0.0143, "step": 77600 }, { "epoch": 0.84, "learning_rate": 0.00017414866705584744, "loss": 0.0166, "step": 77610 }, { "epoch": 0.84, "learning_rate": 0.0001741324511902445, "loss": 0.0116, "step": 77620 }, { "epoch": 0.84, "learning_rate": 0.0001741162353246416, "loss": 0.0133, "step": 77630 }, { "epoch": 0.84, "learning_rate": 0.0001741000194590387, "loss": 0.0148, "step": 77640 }, { "epoch": 0.84, "learning_rate": 0.0001740838035934358, "loss": 0.011, "step": 77650 }, { "epoch": 0.84, "learning_rate": 0.00017406758772783287, "loss": 0.0139, "step": 77660 }, { "epoch": 0.84, "learning_rate": 0.00017405137186223, "loss": 0.0132, "step": 77670 }, { "epoch": 0.84, "learning_rate": 0.00017403515599662708, "loss": 0.0162, "step": 77680 }, { "epoch": 0.84, "learning_rate": 0.00017401894013102418, "loss": 0.0156, "step": 77690 }, { "epoch": 0.84, "learning_rate": 0.0001740027242654213, "loss": 0.0136, "step": 77700 }, { "epoch": 0.84, "learning_rate": 0.00017398650839981836, "loss": 0.0116, "step": 77710 }, { "epoch": 0.84, "learning_rate": 0.00017397029253421546, "loss": 0.012, "step": 77720 }, { "epoch": 0.84, "learning_rate": 0.00017395407666861258, "loss": 0.0177, "step": 77730 }, { "epoch": 0.84, "learning_rate": 0.00017393786080300967, "loss": 0.0177, "step": 77740 }, { "epoch": 0.84, "learning_rate": 0.00017392164493740673, "loss": 0.0167, "step": 77750 }, { "epoch": 0.84, "learning_rate": 0.00017390542907180383, "loss": 0.0143, "step": 77760 }, { "epoch": 0.84, "learning_rate": 0.00017388921320620095, "loss": 0.0167, "step": 77770 }, { "epoch": 0.84, "learning_rate": 0.00017387299734059804, "loss": 0.0106, "step": 77780 }, { "epoch": 0.84, "learning_rate": 0.0001738567814749951, "loss": 0.0167, "step": 77790 }, { "epoch": 0.84, "learning_rate": 0.00017384056560939222, "loss": 0.0139, "step": 77800 }, { "epoch": 0.84, "learning_rate": 0.00017382434974378932, "loss": 0.0165, "step": 77810 }, { "epoch": 0.84, "learning_rate": 0.0001738081338781864, "loss": 0.0136, "step": 77820 }, { "epoch": 0.84, "learning_rate": 0.00017379191801258348, "loss": 0.0131, "step": 77830 }, { "epoch": 0.84, "learning_rate": 0.0001737757021469806, "loss": 0.0123, "step": 77840 }, { "epoch": 0.84, "learning_rate": 0.0001737594862813777, "loss": 0.0176, "step": 77850 }, { "epoch": 0.84, "learning_rate": 0.00017374327041577478, "loss": 0.0175, "step": 77860 }, { "epoch": 0.84, "learning_rate": 0.00017372705455017187, "loss": 0.0115, "step": 77870 }, { "epoch": 0.84, "learning_rate": 0.00017371083868456897, "loss": 0.0141, "step": 77880 }, { "epoch": 0.84, "learning_rate": 0.00017369462281896606, "loss": 0.012, "step": 77890 }, { "epoch": 0.84, "learning_rate": 0.00017367840695336318, "loss": 0.0124, "step": 77900 }, { "epoch": 0.84, "learning_rate": 0.00017366219108776024, "loss": 0.0136, "step": 77910 }, { "epoch": 0.84, "learning_rate": 0.00017364597522215734, "loss": 0.0133, "step": 77920 }, { "epoch": 0.84, "learning_rate": 0.00017362975935655443, "loss": 0.012, "step": 77930 }, { "epoch": 0.84, "learning_rate": 0.00017361354349095155, "loss": 0.012, "step": 77940 }, { "epoch": 0.84, "learning_rate": 0.00017359732762534862, "loss": 0.0137, "step": 77950 }, { "epoch": 0.84, "learning_rate": 0.0001735811117597457, "loss": 0.0117, "step": 77960 }, { "epoch": 0.84, "learning_rate": 0.00017356489589414283, "loss": 0.0141, "step": 77970 }, { "epoch": 0.84, "learning_rate": 0.00017354868002853992, "loss": 0.0155, "step": 77980 }, { "epoch": 0.84, "learning_rate": 0.00017353246416293699, "loss": 0.0156, "step": 77990 }, { "epoch": 0.84, "learning_rate": 0.0001735162482973341, "loss": 0.0169, "step": 78000 }, { "epoch": 0.84, "eval_cer": 0.9215347519356817, "eval_loss": 0.00994004588574171, "eval_runtime": 121.1288, "eval_samples_per_second": 16.511, "eval_steps_per_second": 4.128, "step": 78000 }, { "epoch": 0.84, "learning_rate": 0.0001735000324317312, "loss": 0.0134, "step": 78010 }, { "epoch": 0.84, "learning_rate": 0.0001734838165661283, "loss": 0.014, "step": 78020 }, { "epoch": 0.84, "learning_rate": 0.00017346760070052536, "loss": 0.0133, "step": 78030 }, { "epoch": 0.84, "learning_rate": 0.00017345138483492248, "loss": 0.0144, "step": 78040 }, { "epoch": 0.84, "learning_rate": 0.00017343516896931957, "loss": 0.0143, "step": 78050 }, { "epoch": 0.84, "learning_rate": 0.00017341895310371666, "loss": 0.014, "step": 78060 }, { "epoch": 0.84, "learning_rate": 0.00017340273723811376, "loss": 0.0135, "step": 78070 }, { "epoch": 0.84, "learning_rate": 0.00017338652137251085, "loss": 0.0119, "step": 78080 }, { "epoch": 0.84, "learning_rate": 0.00017337030550690794, "loss": 0.0163, "step": 78090 }, { "epoch": 0.84, "learning_rate": 0.00017335408964130506, "loss": 0.0153, "step": 78100 }, { "epoch": 0.84, "learning_rate": 0.00017333787377570213, "loss": 0.0164, "step": 78110 }, { "epoch": 0.84, "learning_rate": 0.00017332165791009922, "loss": 0.0155, "step": 78120 }, { "epoch": 0.84, "learning_rate": 0.0001733054420444963, "loss": 0.0121, "step": 78130 }, { "epoch": 0.84, "learning_rate": 0.00017328922617889343, "loss": 0.0121, "step": 78140 }, { "epoch": 0.84, "learning_rate": 0.0001732730103132905, "loss": 0.0183, "step": 78150 }, { "epoch": 0.84, "learning_rate": 0.0001732567944476876, "loss": 0.0189, "step": 78160 }, { "epoch": 0.85, "learning_rate": 0.0001732405785820847, "loss": 0.0168, "step": 78170 }, { "epoch": 0.85, "learning_rate": 0.0001732243627164818, "loss": 0.0151, "step": 78180 }, { "epoch": 0.85, "learning_rate": 0.00017320814685087887, "loss": 0.0166, "step": 78190 }, { "epoch": 0.85, "learning_rate": 0.00017319193098527596, "loss": 0.0145, "step": 78200 }, { "epoch": 0.85, "learning_rate": 0.00017317571511967308, "loss": 0.0133, "step": 78210 }, { "epoch": 0.85, "learning_rate": 0.00017315949925407017, "loss": 0.0125, "step": 78220 }, { "epoch": 0.85, "learning_rate": 0.00017314328338846724, "loss": 0.0152, "step": 78230 }, { "epoch": 0.85, "learning_rate": 0.00017312706752286436, "loss": 0.0146, "step": 78240 }, { "epoch": 0.85, "learning_rate": 0.00017311085165726145, "loss": 0.0147, "step": 78250 }, { "epoch": 0.85, "learning_rate": 0.00017309463579165854, "loss": 0.0105, "step": 78260 }, { "epoch": 0.85, "learning_rate": 0.0001730784199260556, "loss": 0.0123, "step": 78270 }, { "epoch": 0.85, "learning_rate": 0.00017306220406045273, "loss": 0.0122, "step": 78280 }, { "epoch": 0.85, "learning_rate": 0.00017304598819484982, "loss": 0.0181, "step": 78290 }, { "epoch": 0.85, "learning_rate": 0.00017302977232924694, "loss": 0.0102, "step": 78300 }, { "epoch": 0.85, "learning_rate": 0.000173013556463644, "loss": 0.0165, "step": 78310 }, { "epoch": 0.85, "learning_rate": 0.0001729973405980411, "loss": 0.0128, "step": 78320 }, { "epoch": 0.85, "learning_rate": 0.0001729811247324382, "loss": 0.013, "step": 78330 }, { "epoch": 0.85, "learning_rate": 0.00017296490886683531, "loss": 0.0156, "step": 78340 }, { "epoch": 0.85, "learning_rate": 0.00017294869300123238, "loss": 0.0138, "step": 78350 }, { "epoch": 0.85, "learning_rate": 0.00017293247713562947, "loss": 0.0132, "step": 78360 }, { "epoch": 0.85, "learning_rate": 0.0001729162612700266, "loss": 0.0126, "step": 78370 }, { "epoch": 0.85, "learning_rate": 0.00017290004540442368, "loss": 0.0138, "step": 78380 }, { "epoch": 0.85, "learning_rate": 0.00017288382953882075, "loss": 0.0125, "step": 78390 }, { "epoch": 0.85, "learning_rate": 0.00017286761367321784, "loss": 0.0158, "step": 78400 }, { "epoch": 0.85, "learning_rate": 0.00017285139780761496, "loss": 0.011, "step": 78410 }, { "epoch": 0.85, "learning_rate": 0.00017283518194201206, "loss": 0.0132, "step": 78420 }, { "epoch": 0.85, "learning_rate": 0.00017281896607640915, "loss": 0.0147, "step": 78430 }, { "epoch": 0.85, "learning_rate": 0.00017280275021080624, "loss": 0.0134, "step": 78440 }, { "epoch": 0.85, "learning_rate": 0.00017278653434520333, "loss": 0.012, "step": 78450 }, { "epoch": 0.85, "learning_rate": 0.00017277031847960043, "loss": 0.0161, "step": 78460 }, { "epoch": 0.85, "learning_rate": 0.00017275410261399755, "loss": 0.0139, "step": 78470 }, { "epoch": 0.85, "learning_rate": 0.0001727378867483946, "loss": 0.0105, "step": 78480 }, { "epoch": 0.85, "learning_rate": 0.0001727216708827917, "loss": 0.0136, "step": 78490 }, { "epoch": 0.85, "learning_rate": 0.0001727054550171888, "loss": 0.0132, "step": 78500 }, { "epoch": 0.85, "learning_rate": 0.00017268923915158592, "loss": 0.0118, "step": 78510 }, { "epoch": 0.85, "learning_rate": 0.00017267302328598298, "loss": 0.0138, "step": 78520 }, { "epoch": 0.85, "learning_rate": 0.00017265680742038008, "loss": 0.015, "step": 78530 }, { "epoch": 0.85, "learning_rate": 0.0001726405915547772, "loss": 0.0159, "step": 78540 }, { "epoch": 0.85, "learning_rate": 0.0001726243756891743, "loss": 0.0165, "step": 78550 }, { "epoch": 0.85, "learning_rate": 0.00017260815982357135, "loss": 0.0151, "step": 78560 }, { "epoch": 0.85, "learning_rate": 0.00017259194395796845, "loss": 0.0167, "step": 78570 }, { "epoch": 0.85, "learning_rate": 0.00017257572809236557, "loss": 0.0117, "step": 78580 }, { "epoch": 0.85, "learning_rate": 0.00017255951222676266, "loss": 0.0116, "step": 78590 }, { "epoch": 0.85, "learning_rate": 0.00017254329636115973, "loss": 0.0128, "step": 78600 }, { "epoch": 0.85, "learning_rate": 0.00017252708049555684, "loss": 0.016, "step": 78610 }, { "epoch": 0.85, "learning_rate": 0.00017251086462995394, "loss": 0.0151, "step": 78620 }, { "epoch": 0.85, "learning_rate": 0.00017249464876435103, "loss": 0.0127, "step": 78630 }, { "epoch": 0.85, "learning_rate": 0.0001724784328987481, "loss": 0.0124, "step": 78640 }, { "epoch": 0.85, "learning_rate": 0.00017246221703314522, "loss": 0.0142, "step": 78650 }, { "epoch": 0.85, "learning_rate": 0.0001724460011675423, "loss": 0.0123, "step": 78660 }, { "epoch": 0.85, "learning_rate": 0.00017242978530193943, "loss": 0.0135, "step": 78670 }, { "epoch": 0.85, "learning_rate": 0.0001724135694363365, "loss": 0.0108, "step": 78680 }, { "epoch": 0.85, "learning_rate": 0.0001723973535707336, "loss": 0.0115, "step": 78690 }, { "epoch": 0.85, "learning_rate": 0.00017238113770513068, "loss": 0.0113, "step": 78700 }, { "epoch": 0.85, "learning_rate": 0.0001723649218395278, "loss": 0.013, "step": 78710 }, { "epoch": 0.85, "learning_rate": 0.00017234870597392487, "loss": 0.0125, "step": 78720 }, { "epoch": 0.85, "learning_rate": 0.00017233249010832196, "loss": 0.0134, "step": 78730 }, { "epoch": 0.85, "learning_rate": 0.00017231627424271908, "loss": 0.0162, "step": 78740 }, { "epoch": 0.85, "learning_rate": 0.00017230005837711617, "loss": 0.0125, "step": 78750 }, { "epoch": 0.85, "learning_rate": 0.00017228384251151324, "loss": 0.0135, "step": 78760 }, { "epoch": 0.85, "learning_rate": 0.00017226762664591033, "loss": 0.0142, "step": 78770 }, { "epoch": 0.85, "learning_rate": 0.00017225141078030745, "loss": 0.012, "step": 78780 }, { "epoch": 0.85, "learning_rate": 0.00017223519491470454, "loss": 0.0121, "step": 78790 }, { "epoch": 0.85, "learning_rate": 0.0001722189790491016, "loss": 0.0146, "step": 78800 }, { "epoch": 0.85, "learning_rate": 0.00017220276318349873, "loss": 0.0143, "step": 78810 }, { "epoch": 0.85, "learning_rate": 0.00017218654731789582, "loss": 0.0112, "step": 78820 }, { "epoch": 0.85, "learning_rate": 0.0001721703314522929, "loss": 0.0154, "step": 78830 }, { "epoch": 0.85, "learning_rate": 0.00017215411558668998, "loss": 0.0126, "step": 78840 }, { "epoch": 0.85, "learning_rate": 0.0001721378997210871, "loss": 0.0148, "step": 78850 }, { "epoch": 0.85, "learning_rate": 0.0001721216838554842, "loss": 0.0135, "step": 78860 }, { "epoch": 0.85, "learning_rate": 0.00017210546798988128, "loss": 0.0144, "step": 78870 }, { "epoch": 0.85, "learning_rate": 0.00017208925212427838, "loss": 0.0126, "step": 78880 }, { "epoch": 0.85, "learning_rate": 0.00017207303625867547, "loss": 0.0135, "step": 78890 }, { "epoch": 0.85, "learning_rate": 0.00017205682039307256, "loss": 0.011, "step": 78900 }, { "epoch": 0.85, "learning_rate": 0.00017204060452746968, "loss": 0.0125, "step": 78910 }, { "epoch": 0.85, "learning_rate": 0.00017202438866186675, "loss": 0.0218, "step": 78920 }, { "epoch": 0.85, "learning_rate": 0.00017200817279626384, "loss": 0.013, "step": 78930 }, { "epoch": 0.85, "learning_rate": 0.00017199195693066093, "loss": 0.0125, "step": 78940 }, { "epoch": 0.85, "learning_rate": 0.00017197574106505805, "loss": 0.0154, "step": 78950 }, { "epoch": 0.85, "learning_rate": 0.00017195952519945512, "loss": 0.0139, "step": 78960 }, { "epoch": 0.85, "learning_rate": 0.0001719433093338522, "loss": 0.011, "step": 78970 }, { "epoch": 0.85, "learning_rate": 0.00017192709346824933, "loss": 0.0168, "step": 78980 }, { "epoch": 0.85, "learning_rate": 0.00017191087760264642, "loss": 0.0151, "step": 78990 }, { "epoch": 0.85, "learning_rate": 0.0001718946617370435, "loss": 0.0118, "step": 79000 }, { "epoch": 0.85, "eval_cer": 0.9215269345090743, "eval_loss": 0.010222644545137882, "eval_runtime": 121.2156, "eval_samples_per_second": 16.5, "eval_steps_per_second": 4.125, "step": 79000 }, { "epoch": 0.85, "learning_rate": 0.0001718784458714406, "loss": 0.0163, "step": 79010 }, { "epoch": 0.85, "learning_rate": 0.0001718622300058377, "loss": 0.0147, "step": 79020 }, { "epoch": 0.85, "learning_rate": 0.0001718460141402348, "loss": 0.0117, "step": 79030 }, { "epoch": 0.85, "learning_rate": 0.00017182979827463186, "loss": 0.0135, "step": 79040 }, { "epoch": 0.85, "learning_rate": 0.00017181358240902898, "loss": 0.0129, "step": 79050 }, { "epoch": 0.85, "learning_rate": 0.00017179736654342607, "loss": 0.0142, "step": 79060 }, { "epoch": 0.85, "learning_rate": 0.00017178115067782317, "loss": 0.0142, "step": 79070 }, { "epoch": 0.85, "learning_rate": 0.00017176493481222026, "loss": 0.0154, "step": 79080 }, { "epoch": 0.86, "learning_rate": 0.00017174871894661735, "loss": 0.0135, "step": 79090 }, { "epoch": 0.86, "learning_rate": 0.00017173250308101444, "loss": 0.014, "step": 79100 }, { "epoch": 0.86, "learning_rate": 0.00017171628721541156, "loss": 0.016, "step": 79110 }, { "epoch": 0.86, "learning_rate": 0.00017170007134980863, "loss": 0.0166, "step": 79120 }, { "epoch": 0.86, "learning_rate": 0.00017168385548420572, "loss": 0.0118, "step": 79130 }, { "epoch": 0.86, "learning_rate": 0.00017166763961860281, "loss": 0.019, "step": 79140 }, { "epoch": 0.86, "learning_rate": 0.00017165142375299993, "loss": 0.0133, "step": 79150 }, { "epoch": 0.86, "learning_rate": 0.00017163520788739703, "loss": 0.0132, "step": 79160 }, { "epoch": 0.86, "learning_rate": 0.0001716189920217941, "loss": 0.0187, "step": 79170 }, { "epoch": 0.86, "learning_rate": 0.0001716027761561912, "loss": 0.0116, "step": 79180 }, { "epoch": 0.86, "learning_rate": 0.0001715865602905883, "loss": 0.0122, "step": 79190 }, { "epoch": 0.86, "learning_rate": 0.0001715703444249854, "loss": 0.0137, "step": 79200 }, { "epoch": 0.86, "learning_rate": 0.00017155412855938246, "loss": 0.014, "step": 79210 }, { "epoch": 0.86, "learning_rate": 0.00017153791269377958, "loss": 0.012, "step": 79220 }, { "epoch": 0.86, "learning_rate": 0.00017152169682817668, "loss": 0.0128, "step": 79230 }, { "epoch": 0.86, "learning_rate": 0.00017150548096257377, "loss": 0.0124, "step": 79240 }, { "epoch": 0.86, "learning_rate": 0.00017148926509697086, "loss": 0.0127, "step": 79250 }, { "epoch": 0.86, "learning_rate": 0.00017147304923136795, "loss": 0.0123, "step": 79260 }, { "epoch": 0.86, "learning_rate": 0.00017145683336576505, "loss": 0.0139, "step": 79270 }, { "epoch": 0.86, "learning_rate": 0.00017144061750016217, "loss": 0.0105, "step": 79280 }, { "epoch": 0.86, "learning_rate": 0.00017142440163455923, "loss": 0.0129, "step": 79290 }, { "epoch": 0.86, "learning_rate": 0.00017140818576895633, "loss": 0.012, "step": 79300 }, { "epoch": 0.86, "learning_rate": 0.00017139196990335345, "loss": 0.015, "step": 79310 }, { "epoch": 0.86, "learning_rate": 0.00017137575403775054, "loss": 0.0134, "step": 79320 }, { "epoch": 0.86, "learning_rate": 0.0001713595381721476, "loss": 0.0149, "step": 79330 }, { "epoch": 0.86, "learning_rate": 0.0001713433223065447, "loss": 0.0136, "step": 79340 }, { "epoch": 0.86, "learning_rate": 0.00017132710644094182, "loss": 0.0129, "step": 79350 }, { "epoch": 0.86, "learning_rate": 0.0001713108905753389, "loss": 0.0164, "step": 79360 }, { "epoch": 0.86, "learning_rate": 0.00017129467470973597, "loss": 0.0175, "step": 79370 }, { "epoch": 0.86, "learning_rate": 0.0001712784588441331, "loss": 0.0123, "step": 79380 }, { "epoch": 0.86, "learning_rate": 0.0001712622429785302, "loss": 0.0143, "step": 79390 }, { "epoch": 0.86, "learning_rate": 0.00017124602711292728, "loss": 0.0144, "step": 79400 }, { "epoch": 0.86, "learning_rate": 0.00017122981124732435, "loss": 0.0134, "step": 79410 }, { "epoch": 0.86, "learning_rate": 0.00017121359538172147, "loss": 0.0124, "step": 79420 }, { "epoch": 0.86, "learning_rate": 0.00017119737951611856, "loss": 0.0125, "step": 79430 }, { "epoch": 0.86, "learning_rate": 0.00017118116365051565, "loss": 0.0142, "step": 79440 }, { "epoch": 0.86, "learning_rate": 0.00017116494778491274, "loss": 0.0128, "step": 79450 }, { "epoch": 0.86, "learning_rate": 0.00017114873191930984, "loss": 0.012, "step": 79460 }, { "epoch": 0.86, "learning_rate": 0.00017113251605370693, "loss": 0.012, "step": 79470 }, { "epoch": 0.86, "learning_rate": 0.00017111630018810405, "loss": 0.0148, "step": 79480 }, { "epoch": 0.86, "learning_rate": 0.00017110008432250111, "loss": 0.0139, "step": 79490 }, { "epoch": 0.86, "learning_rate": 0.0001710838684568982, "loss": 0.0116, "step": 79500 }, { "epoch": 0.86, "learning_rate": 0.0001710676525912953, "loss": 0.0152, "step": 79510 }, { "epoch": 0.86, "learning_rate": 0.00017105143672569242, "loss": 0.0117, "step": 79520 }, { "epoch": 0.86, "learning_rate": 0.00017103522086008949, "loss": 0.0124, "step": 79530 }, { "epoch": 0.86, "learning_rate": 0.00017101900499448658, "loss": 0.013, "step": 79540 }, { "epoch": 0.86, "learning_rate": 0.0001710027891288837, "loss": 0.0163, "step": 79550 }, { "epoch": 0.86, "learning_rate": 0.0001709865732632808, "loss": 0.0131, "step": 79560 }, { "epoch": 0.86, "learning_rate": 0.00017097035739767786, "loss": 0.0126, "step": 79570 }, { "epoch": 0.86, "learning_rate": 0.00017095414153207495, "loss": 0.0141, "step": 79580 }, { "epoch": 0.86, "learning_rate": 0.00017093792566647207, "loss": 0.0153, "step": 79590 }, { "epoch": 0.86, "learning_rate": 0.00017092170980086916, "loss": 0.0139, "step": 79600 }, { "epoch": 0.86, "learning_rate": 0.00017090549393526623, "loss": 0.0127, "step": 79610 }, { "epoch": 0.86, "learning_rate": 0.00017088927806966335, "loss": 0.0146, "step": 79620 }, { "epoch": 0.86, "learning_rate": 0.00017087306220406044, "loss": 0.0122, "step": 79630 }, { "epoch": 0.86, "learning_rate": 0.00017085684633845753, "loss": 0.0161, "step": 79640 }, { "epoch": 0.86, "learning_rate": 0.0001708406304728546, "loss": 0.014, "step": 79650 }, { "epoch": 0.86, "learning_rate": 0.00017082441460725172, "loss": 0.015, "step": 79660 }, { "epoch": 0.86, "learning_rate": 0.0001708081987416488, "loss": 0.0102, "step": 79670 }, { "epoch": 0.86, "learning_rate": 0.00017079198287604593, "loss": 0.0135, "step": 79680 }, { "epoch": 0.86, "learning_rate": 0.000170775767010443, "loss": 0.0132, "step": 79690 }, { "epoch": 0.86, "learning_rate": 0.0001707595511448401, "loss": 0.0136, "step": 79700 }, { "epoch": 0.86, "learning_rate": 0.00017074333527923718, "loss": 0.0145, "step": 79710 }, { "epoch": 0.86, "learning_rate": 0.0001707271194136343, "loss": 0.0163, "step": 79720 }, { "epoch": 0.86, "learning_rate": 0.00017071090354803137, "loss": 0.0138, "step": 79730 }, { "epoch": 0.86, "learning_rate": 0.00017069468768242846, "loss": 0.0111, "step": 79740 }, { "epoch": 0.86, "learning_rate": 0.00017067847181682558, "loss": 0.012, "step": 79750 }, { "epoch": 0.86, "learning_rate": 0.00017066225595122267, "loss": 0.0192, "step": 79760 }, { "epoch": 0.86, "learning_rate": 0.00017064604008561974, "loss": 0.0165, "step": 79770 }, { "epoch": 0.86, "learning_rate": 0.00017062982422001683, "loss": 0.0143, "step": 79780 }, { "epoch": 0.86, "learning_rate": 0.00017061360835441395, "loss": 0.0154, "step": 79790 }, { "epoch": 0.86, "learning_rate": 0.00017059739248881104, "loss": 0.0127, "step": 79800 }, { "epoch": 0.86, "learning_rate": 0.0001705811766232081, "loss": 0.0167, "step": 79810 }, { "epoch": 0.86, "learning_rate": 0.00017056496075760523, "loss": 0.0135, "step": 79820 }, { "epoch": 0.86, "learning_rate": 0.00017054874489200232, "loss": 0.0143, "step": 79830 }, { "epoch": 0.86, "learning_rate": 0.00017053252902639941, "loss": 0.0157, "step": 79840 }, { "epoch": 0.86, "learning_rate": 0.00017051631316079653, "loss": 0.0158, "step": 79850 }, { "epoch": 0.86, "learning_rate": 0.0001705000972951936, "loss": 0.0123, "step": 79860 }, { "epoch": 0.86, "learning_rate": 0.0001704838814295907, "loss": 0.0112, "step": 79870 }, { "epoch": 0.86, "learning_rate": 0.00017046766556398779, "loss": 0.0127, "step": 79880 }, { "epoch": 0.86, "learning_rate": 0.0001704514496983849, "loss": 0.014, "step": 79890 }, { "epoch": 0.86, "learning_rate": 0.00017043523383278197, "loss": 0.0152, "step": 79900 }, { "epoch": 0.86, "learning_rate": 0.00017041901796717906, "loss": 0.0139, "step": 79910 }, { "epoch": 0.86, "learning_rate": 0.00017040280210157618, "loss": 0.0141, "step": 79920 }, { "epoch": 0.86, "learning_rate": 0.00017038658623597328, "loss": 0.0137, "step": 79930 }, { "epoch": 0.86, "learning_rate": 0.00017037037037037034, "loss": 0.0168, "step": 79940 }, { "epoch": 0.86, "learning_rate": 0.00017035415450476744, "loss": 0.0143, "step": 79950 }, { "epoch": 0.86, "learning_rate": 0.00017033793863916455, "loss": 0.0155, "step": 79960 }, { "epoch": 0.86, "learning_rate": 0.00017032172277356165, "loss": 0.0136, "step": 79970 }, { "epoch": 0.86, "learning_rate": 0.0001703055069079587, "loss": 0.0139, "step": 79980 }, { "epoch": 0.86, "learning_rate": 0.00017028929104235583, "loss": 0.0135, "step": 79990 }, { "epoch": 0.86, "learning_rate": 0.00017027307517675293, "loss": 0.0178, "step": 80000 }, { "epoch": 0.86, "eval_cer": 0.9215417007593327, "eval_loss": 0.009527038782835007, "eval_runtime": 121.101, "eval_samples_per_second": 16.515, "eval_steps_per_second": 4.129, "step": 80000 }, { "epoch": 0.86, "learning_rate": 0.00017025685931115002, "loss": 0.0148, "step": 80010 }, { "epoch": 0.87, "learning_rate": 0.0001702406434455471, "loss": 0.0141, "step": 80020 }, { "epoch": 0.87, "learning_rate": 0.0001702244275799442, "loss": 0.0139, "step": 80030 }, { "epoch": 0.87, "learning_rate": 0.0001702082117143413, "loss": 0.0109, "step": 80040 }, { "epoch": 0.87, "learning_rate": 0.00017019199584873842, "loss": 0.0125, "step": 80050 }, { "epoch": 0.87, "learning_rate": 0.00017017577998313548, "loss": 0.014, "step": 80060 }, { "epoch": 0.87, "learning_rate": 0.00017015956411753258, "loss": 0.0139, "step": 80070 }, { "epoch": 0.87, "learning_rate": 0.00017014334825192967, "loss": 0.0113, "step": 80080 }, { "epoch": 0.87, "learning_rate": 0.0001701271323863268, "loss": 0.0108, "step": 80090 }, { "epoch": 0.87, "learning_rate": 0.00017011091652072385, "loss": 0.0129, "step": 80100 }, { "epoch": 0.87, "learning_rate": 0.00017009470065512095, "loss": 0.0155, "step": 80110 }, { "epoch": 0.87, "learning_rate": 0.00017007848478951807, "loss": 0.0134, "step": 80120 }, { "epoch": 0.87, "learning_rate": 0.00017006226892391516, "loss": 0.0146, "step": 80130 }, { "epoch": 0.87, "learning_rate": 0.00017004605305831222, "loss": 0.0107, "step": 80140 }, { "epoch": 0.87, "learning_rate": 0.00017002983719270932, "loss": 0.0114, "step": 80150 }, { "epoch": 0.87, "learning_rate": 0.00017001362132710644, "loss": 0.0129, "step": 80160 }, { "epoch": 0.87, "learning_rate": 0.00016999740546150353, "loss": 0.0097, "step": 80170 }, { "epoch": 0.87, "learning_rate": 0.0001699811895959006, "loss": 0.0138, "step": 80180 }, { "epoch": 0.87, "learning_rate": 0.00016996497373029772, "loss": 0.0104, "step": 80190 }, { "epoch": 0.87, "learning_rate": 0.0001699487578646948, "loss": 0.0146, "step": 80200 }, { "epoch": 0.87, "learning_rate": 0.0001699325419990919, "loss": 0.0138, "step": 80210 }, { "epoch": 0.87, "learning_rate": 0.00016991632613348897, "loss": 0.014, "step": 80220 }, { "epoch": 0.87, "learning_rate": 0.00016990011026788609, "loss": 0.0145, "step": 80230 }, { "epoch": 0.87, "learning_rate": 0.00016988389440228318, "loss": 0.0102, "step": 80240 }, { "epoch": 0.87, "learning_rate": 0.00016986767853668027, "loss": 0.0148, "step": 80250 }, { "epoch": 0.87, "learning_rate": 0.00016985146267107736, "loss": 0.0156, "step": 80260 }, { "epoch": 0.87, "learning_rate": 0.00016983524680547446, "loss": 0.0134, "step": 80270 }, { "epoch": 0.87, "learning_rate": 0.00016981903093987155, "loss": 0.0139, "step": 80280 }, { "epoch": 0.87, "learning_rate": 0.00016980281507426867, "loss": 0.0149, "step": 80290 }, { "epoch": 0.87, "learning_rate": 0.00016978659920866574, "loss": 0.0121, "step": 80300 }, { "epoch": 0.87, "learning_rate": 0.00016977038334306283, "loss": 0.015, "step": 80310 }, { "epoch": 0.87, "learning_rate": 0.00016975416747745995, "loss": 0.0144, "step": 80320 }, { "epoch": 0.87, "learning_rate": 0.00016973795161185704, "loss": 0.0129, "step": 80330 }, { "epoch": 0.87, "learning_rate": 0.0001697217357462541, "loss": 0.0127, "step": 80340 }, { "epoch": 0.87, "learning_rate": 0.0001697055198806512, "loss": 0.0142, "step": 80350 }, { "epoch": 0.87, "learning_rate": 0.00016968930401504832, "loss": 0.0122, "step": 80360 }, { "epoch": 0.87, "learning_rate": 0.0001696730881494454, "loss": 0.014, "step": 80370 }, { "epoch": 0.87, "learning_rate": 0.00016965687228384248, "loss": 0.0144, "step": 80380 }, { "epoch": 0.87, "learning_rate": 0.0001696406564182396, "loss": 0.0154, "step": 80390 }, { "epoch": 0.87, "learning_rate": 0.0001696244405526367, "loss": 0.0111, "step": 80400 }, { "epoch": 0.87, "learning_rate": 0.00016960822468703378, "loss": 0.0138, "step": 80410 }, { "epoch": 0.87, "learning_rate": 0.00016959200882143085, "loss": 0.0124, "step": 80420 }, { "epoch": 0.87, "learning_rate": 0.00016957579295582797, "loss": 0.0161, "step": 80430 }, { "epoch": 0.87, "learning_rate": 0.00016955957709022506, "loss": 0.0144, "step": 80440 }, { "epoch": 0.87, "learning_rate": 0.00016954336122462215, "loss": 0.0145, "step": 80450 }, { "epoch": 0.87, "learning_rate": 0.00016952714535901925, "loss": 0.0149, "step": 80460 }, { "epoch": 0.87, "learning_rate": 0.00016951092949341634, "loss": 0.0133, "step": 80470 }, { "epoch": 0.87, "learning_rate": 0.00016949471362781343, "loss": 0.014, "step": 80480 }, { "epoch": 0.87, "learning_rate": 0.00016947849776221055, "loss": 0.0118, "step": 80490 }, { "epoch": 0.87, "learning_rate": 0.00016946228189660762, "loss": 0.0106, "step": 80500 }, { "epoch": 0.87, "learning_rate": 0.0001694460660310047, "loss": 0.0128, "step": 80510 }, { "epoch": 0.87, "learning_rate": 0.0001694298501654018, "loss": 0.0136, "step": 80520 }, { "epoch": 0.87, "learning_rate": 0.00016941363429979892, "loss": 0.014, "step": 80530 }, { "epoch": 0.87, "learning_rate": 0.000169397418434196, "loss": 0.0122, "step": 80540 }, { "epoch": 0.87, "learning_rate": 0.00016938120256859308, "loss": 0.0121, "step": 80550 }, { "epoch": 0.87, "learning_rate": 0.0001693649867029902, "loss": 0.0116, "step": 80560 }, { "epoch": 0.87, "learning_rate": 0.0001693487708373873, "loss": 0.0124, "step": 80570 }, { "epoch": 0.87, "learning_rate": 0.00016933255497178439, "loss": 0.0138, "step": 80580 }, { "epoch": 0.87, "learning_rate": 0.00016931633910618145, "loss": 0.0121, "step": 80590 }, { "epoch": 0.87, "learning_rate": 0.00016930012324057857, "loss": 0.0143, "step": 80600 }, { "epoch": 0.87, "learning_rate": 0.00016928390737497566, "loss": 0.0143, "step": 80610 }, { "epoch": 0.87, "learning_rate": 0.00016926769150937278, "loss": 0.0124, "step": 80620 }, { "epoch": 0.87, "learning_rate": 0.00016925147564376985, "loss": 0.0122, "step": 80630 }, { "epoch": 0.87, "learning_rate": 0.00016923525977816694, "loss": 0.0122, "step": 80640 }, { "epoch": 0.87, "learning_rate": 0.00016921904391256404, "loss": 0.0135, "step": 80650 }, { "epoch": 0.87, "learning_rate": 0.00016920282804696116, "loss": 0.0125, "step": 80660 }, { "epoch": 0.87, "learning_rate": 0.00016918661218135822, "loss": 0.019, "step": 80670 }, { "epoch": 0.87, "learning_rate": 0.00016917039631575531, "loss": 0.0127, "step": 80680 }, { "epoch": 0.87, "learning_rate": 0.00016915418045015243, "loss": 0.0105, "step": 80690 }, { "epoch": 0.87, "learning_rate": 0.00016913796458454953, "loss": 0.0115, "step": 80700 }, { "epoch": 0.87, "learning_rate": 0.0001691217487189466, "loss": 0.0146, "step": 80710 }, { "epoch": 0.87, "learning_rate": 0.00016910553285334368, "loss": 0.0143, "step": 80720 }, { "epoch": 0.87, "learning_rate": 0.0001690893169877408, "loss": 0.0119, "step": 80730 }, { "epoch": 0.87, "learning_rate": 0.0001690731011221379, "loss": 0.0138, "step": 80740 }, { "epoch": 0.87, "learning_rate": 0.00016905688525653496, "loss": 0.0173, "step": 80750 }, { "epoch": 0.87, "learning_rate": 0.00016904066939093208, "loss": 0.0135, "step": 80760 }, { "epoch": 0.87, "learning_rate": 0.00016902445352532918, "loss": 0.0135, "step": 80770 }, { "epoch": 0.87, "learning_rate": 0.00016900823765972627, "loss": 0.0125, "step": 80780 }, { "epoch": 0.87, "learning_rate": 0.00016899202179412333, "loss": 0.0128, "step": 80790 }, { "epoch": 0.87, "learning_rate": 0.00016897580592852045, "loss": 0.0148, "step": 80800 }, { "epoch": 0.87, "learning_rate": 0.00016895959006291755, "loss": 0.0145, "step": 80810 }, { "epoch": 0.87, "learning_rate": 0.00016894337419731464, "loss": 0.013, "step": 80820 }, { "epoch": 0.87, "learning_rate": 0.00016892715833171173, "loss": 0.0157, "step": 80830 }, { "epoch": 0.87, "learning_rate": 0.00016891094246610882, "loss": 0.0147, "step": 80840 }, { "epoch": 0.87, "learning_rate": 0.00016889472660050592, "loss": 0.0128, "step": 80850 }, { "epoch": 0.87, "learning_rate": 0.00016887851073490304, "loss": 0.0148, "step": 80860 }, { "epoch": 0.87, "learning_rate": 0.0001688622948693001, "loss": 0.0134, "step": 80870 }, { "epoch": 0.87, "learning_rate": 0.0001688460790036972, "loss": 0.0116, "step": 80880 }, { "epoch": 0.87, "learning_rate": 0.0001688298631380943, "loss": 0.0117, "step": 80890 }, { "epoch": 0.87, "learning_rate": 0.0001688136472724914, "loss": 0.0125, "step": 80900 }, { "epoch": 0.87, "learning_rate": 0.00016879743140688847, "loss": 0.0134, "step": 80910 }, { "epoch": 0.87, "learning_rate": 0.00016878121554128557, "loss": 0.0136, "step": 80920 }, { "epoch": 0.87, "learning_rate": 0.0001687649996756827, "loss": 0.0156, "step": 80930 }, { "epoch": 0.88, "learning_rate": 0.00016874878381007978, "loss": 0.0128, "step": 80940 }, { "epoch": 0.88, "learning_rate": 0.00016873256794447685, "loss": 0.0128, "step": 80950 }, { "epoch": 0.88, "learning_rate": 0.00016871635207887394, "loss": 0.0135, "step": 80960 }, { "epoch": 0.88, "learning_rate": 0.00016870013621327106, "loss": 0.0134, "step": 80970 }, { "epoch": 0.88, "learning_rate": 0.00016868392034766815, "loss": 0.0192, "step": 80980 }, { "epoch": 0.88, "learning_rate": 0.00016866770448206522, "loss": 0.0149, "step": 80990 }, { "epoch": 0.88, "learning_rate": 0.00016865148861646234, "loss": 0.0145, "step": 81000 }, { "epoch": 0.88, "eval_cer": 0.9215668902450677, "eval_loss": 0.009719022549688816, "eval_runtime": 121.2086, "eval_samples_per_second": 16.5, "eval_steps_per_second": 4.125, "step": 81000 }, { "epoch": 0.88, "learning_rate": 0.00016863527275085943, "loss": 0.0142, "step": 81010 }, { "epoch": 0.88, "learning_rate": 0.00016861905688525652, "loss": 0.0147, "step": 81020 }, { "epoch": 0.88, "learning_rate": 0.00016860284101965361, "loss": 0.0128, "step": 81030 }, { "epoch": 0.88, "learning_rate": 0.0001685866251540507, "loss": 0.0136, "step": 81040 }, { "epoch": 0.88, "learning_rate": 0.0001685704092884478, "loss": 0.0129, "step": 81050 }, { "epoch": 0.88, "learning_rate": 0.00016855419342284492, "loss": 0.0127, "step": 81060 }, { "epoch": 0.88, "learning_rate": 0.00016853797755724199, "loss": 0.0123, "step": 81070 }, { "epoch": 0.88, "learning_rate": 0.00016852176169163908, "loss": 0.0125, "step": 81080 }, { "epoch": 0.88, "learning_rate": 0.00016850554582603617, "loss": 0.011, "step": 81090 }, { "epoch": 0.88, "learning_rate": 0.0001684893299604333, "loss": 0.0137, "step": 81100 }, { "epoch": 0.88, "learning_rate": 0.00016847311409483036, "loss": 0.0146, "step": 81110 }, { "epoch": 0.88, "learning_rate": 0.00016845689822922745, "loss": 0.0126, "step": 81120 }, { "epoch": 0.88, "learning_rate": 0.00016844068236362457, "loss": 0.0086, "step": 81130 }, { "epoch": 0.88, "learning_rate": 0.00016842446649802166, "loss": 0.0144, "step": 81140 }, { "epoch": 0.88, "learning_rate": 0.00016840825063241873, "loss": 0.0136, "step": 81150 }, { "epoch": 0.88, "learning_rate": 0.00016839203476681582, "loss": 0.0122, "step": 81160 }, { "epoch": 0.88, "learning_rate": 0.00016837581890121294, "loss": 0.0107, "step": 81170 }, { "epoch": 0.88, "learning_rate": 0.00016835960303561003, "loss": 0.0135, "step": 81180 }, { "epoch": 0.88, "learning_rate": 0.0001683433871700071, "loss": 0.0186, "step": 81190 }, { "epoch": 0.88, "learning_rate": 0.00016832717130440422, "loss": 0.0132, "step": 81200 }, { "epoch": 0.88, "learning_rate": 0.0001683109554388013, "loss": 0.0112, "step": 81210 }, { "epoch": 0.88, "learning_rate": 0.0001682947395731984, "loss": 0.0132, "step": 81220 }, { "epoch": 0.88, "learning_rate": 0.00016827852370759547, "loss": 0.0125, "step": 81230 }, { "epoch": 0.88, "learning_rate": 0.0001682623078419926, "loss": 0.0137, "step": 81240 }, { "epoch": 0.88, "learning_rate": 0.00016824609197638968, "loss": 0.013, "step": 81250 }, { "epoch": 0.88, "learning_rate": 0.00016822987611078677, "loss": 0.014, "step": 81260 }, { "epoch": 0.88, "learning_rate": 0.00016821366024518387, "loss": 0.0149, "step": 81270 }, { "epoch": 0.88, "learning_rate": 0.00016819744437958096, "loss": 0.0146, "step": 81280 }, { "epoch": 0.88, "learning_rate": 0.00016818122851397805, "loss": 0.0109, "step": 81290 }, { "epoch": 0.88, "learning_rate": 0.00016816501264837517, "loss": 0.0127, "step": 81300 }, { "epoch": 0.88, "learning_rate": 0.00016814879678277227, "loss": 0.0104, "step": 81310 }, { "epoch": 0.88, "learning_rate": 0.00016813258091716933, "loss": 0.0128, "step": 81320 }, { "epoch": 0.88, "learning_rate": 0.00016811636505156645, "loss": 0.0152, "step": 81330 }, { "epoch": 0.88, "learning_rate": 0.00016810014918596354, "loss": 0.0124, "step": 81340 }, { "epoch": 0.88, "learning_rate": 0.00016808393332036064, "loss": 0.0137, "step": 81350 }, { "epoch": 0.88, "learning_rate": 0.0001680677174547577, "loss": 0.0146, "step": 81360 }, { "epoch": 0.88, "learning_rate": 0.00016805150158915482, "loss": 0.0121, "step": 81370 }, { "epoch": 0.88, "learning_rate": 0.00016803528572355191, "loss": 0.0119, "step": 81380 }, { "epoch": 0.88, "learning_rate": 0.000168019069857949, "loss": 0.0137, "step": 81390 }, { "epoch": 0.88, "learning_rate": 0.0001680028539923461, "loss": 0.0108, "step": 81400 }, { "epoch": 0.88, "learning_rate": 0.0001679866381267432, "loss": 0.0107, "step": 81410 }, { "epoch": 0.88, "learning_rate": 0.00016797042226114029, "loss": 0.0115, "step": 81420 }, { "epoch": 0.88, "learning_rate": 0.0001679542063955374, "loss": 0.0162, "step": 81430 }, { "epoch": 0.88, "learning_rate": 0.00016793799052993447, "loss": 0.0145, "step": 81440 }, { "epoch": 0.88, "learning_rate": 0.00016792177466433156, "loss": 0.0156, "step": 81450 }, { "epoch": 0.88, "learning_rate": 0.00016790555879872866, "loss": 0.0126, "step": 81460 }, { "epoch": 0.88, "learning_rate": 0.00016788934293312578, "loss": 0.0134, "step": 81470 }, { "epoch": 0.88, "learning_rate": 0.00016787312706752284, "loss": 0.0139, "step": 81480 }, { "epoch": 0.88, "learning_rate": 0.00016785691120191993, "loss": 0.0154, "step": 81490 }, { "epoch": 0.88, "learning_rate": 0.00016784069533631705, "loss": 0.0113, "step": 81500 }, { "epoch": 0.88, "learning_rate": 0.00016782447947071415, "loss": 0.0113, "step": 81510 }, { "epoch": 0.88, "learning_rate": 0.0001678082636051112, "loss": 0.0158, "step": 81520 }, { "epoch": 0.88, "learning_rate": 0.0001677920477395083, "loss": 0.0143, "step": 81530 }, { "epoch": 0.88, "learning_rate": 0.00016777583187390543, "loss": 0.0122, "step": 81540 }, { "epoch": 0.88, "learning_rate": 0.00016775961600830252, "loss": 0.0145, "step": 81550 }, { "epoch": 0.88, "learning_rate": 0.00016774340014269958, "loss": 0.0132, "step": 81560 }, { "epoch": 0.88, "learning_rate": 0.0001677271842770967, "loss": 0.0107, "step": 81570 }, { "epoch": 0.88, "learning_rate": 0.0001677109684114938, "loss": 0.0176, "step": 81580 }, { "epoch": 0.88, "learning_rate": 0.0001676947525458909, "loss": 0.0117, "step": 81590 }, { "epoch": 0.88, "learning_rate": 0.00016767853668028795, "loss": 0.0139, "step": 81600 }, { "epoch": 0.88, "learning_rate": 0.00016766232081468507, "loss": 0.0135, "step": 81610 }, { "epoch": 0.88, "learning_rate": 0.00016764610494908217, "loss": 0.0136, "step": 81620 }, { "epoch": 0.88, "learning_rate": 0.0001676298890834793, "loss": 0.0197, "step": 81630 }, { "epoch": 0.88, "learning_rate": 0.00016761367321787635, "loss": 0.015, "step": 81640 }, { "epoch": 0.88, "learning_rate": 0.00016759745735227345, "loss": 0.0127, "step": 81650 }, { "epoch": 0.88, "learning_rate": 0.00016758124148667054, "loss": 0.014, "step": 81660 }, { "epoch": 0.88, "learning_rate": 0.00016756502562106766, "loss": 0.015, "step": 81670 }, { "epoch": 0.88, "learning_rate": 0.00016754880975546472, "loss": 0.0127, "step": 81680 }, { "epoch": 0.88, "learning_rate": 0.00016753259388986182, "loss": 0.013, "step": 81690 }, { "epoch": 0.88, "learning_rate": 0.00016751637802425894, "loss": 0.0135, "step": 81700 }, { "epoch": 0.88, "learning_rate": 0.00016750016215865603, "loss": 0.0137, "step": 81710 }, { "epoch": 0.88, "learning_rate": 0.0001674839462930531, "loss": 0.0146, "step": 81720 }, { "epoch": 0.88, "learning_rate": 0.0001674677304274502, "loss": 0.0191, "step": 81730 }, { "epoch": 0.88, "learning_rate": 0.0001674515145618473, "loss": 0.0152, "step": 81740 }, { "epoch": 0.88, "learning_rate": 0.0001674352986962444, "loss": 0.0116, "step": 81750 }, { "epoch": 0.88, "learning_rate": 0.00016741908283064147, "loss": 0.0171, "step": 81760 }, { "epoch": 0.88, "learning_rate": 0.00016740286696503859, "loss": 0.0124, "step": 81770 }, { "epoch": 0.88, "learning_rate": 0.00016738665109943568, "loss": 0.0125, "step": 81780 }, { "epoch": 0.88, "learning_rate": 0.00016737043523383277, "loss": 0.0115, "step": 81790 }, { "epoch": 0.88, "learning_rate": 0.00016735421936822984, "loss": 0.013, "step": 81800 }, { "epoch": 0.88, "learning_rate": 0.00016733800350262696, "loss": 0.0137, "step": 81810 }, { "epoch": 0.88, "learning_rate": 0.00016732178763702405, "loss": 0.0142, "step": 81820 }, { "epoch": 0.88, "learning_rate": 0.00016730557177142114, "loss": 0.0124, "step": 81830 }, { "epoch": 0.88, "learning_rate": 0.00016728935590581823, "loss": 0.0124, "step": 81840 }, { "epoch": 0.88, "learning_rate": 0.00016727314004021533, "loss": 0.0134, "step": 81850 }, { "epoch": 0.88, "learning_rate": 0.00016725692417461242, "loss": 0.0135, "step": 81860 }, { "epoch": 0.89, "learning_rate": 0.00016724070830900954, "loss": 0.0139, "step": 81870 }, { "epoch": 0.89, "learning_rate": 0.0001672244924434066, "loss": 0.0106, "step": 81880 }, { "epoch": 0.89, "learning_rate": 0.0001672082765778037, "loss": 0.0172, "step": 81890 }, { "epoch": 0.89, "learning_rate": 0.0001671920607122008, "loss": 0.0129, "step": 81900 }, { "epoch": 0.89, "learning_rate": 0.0001671758448465979, "loss": 0.0136, "step": 81910 }, { "epoch": 0.89, "learning_rate": 0.00016715962898099498, "loss": 0.0154, "step": 81920 }, { "epoch": 0.89, "learning_rate": 0.00016714341311539207, "loss": 0.011, "step": 81930 }, { "epoch": 0.89, "learning_rate": 0.0001671271972497892, "loss": 0.011, "step": 81940 }, { "epoch": 0.89, "learning_rate": 0.00016711098138418628, "loss": 0.0153, "step": 81950 }, { "epoch": 0.89, "learning_rate": 0.00016709476551858335, "loss": 0.0128, "step": 81960 }, { "epoch": 0.89, "learning_rate": 0.00016707854965298044, "loss": 0.015, "step": 81970 }, { "epoch": 0.89, "learning_rate": 0.00016706233378737756, "loss": 0.0132, "step": 81980 }, { "epoch": 0.89, "learning_rate": 0.00016704611792177465, "loss": 0.0192, "step": 81990 }, { "epoch": 0.89, "learning_rate": 0.00016702990205617172, "loss": 0.0154, "step": 82000 }, { "epoch": 0.89, "eval_cer": 0.9215382263475072, "eval_loss": 0.009874101728200912, "eval_runtime": 121.2944, "eval_samples_per_second": 16.489, "eval_steps_per_second": 4.122, "step": 82000 }, { "epoch": 0.89, "learning_rate": 0.00016701368619056884, "loss": 0.0153, "step": 82010 }, { "epoch": 0.89, "learning_rate": 0.00016699747032496593, "loss": 0.0194, "step": 82020 }, { "epoch": 0.89, "learning_rate": 0.00016698125445936302, "loss": 0.0155, "step": 82030 }, { "epoch": 0.89, "learning_rate": 0.00016696503859376014, "loss": 0.0133, "step": 82040 }, { "epoch": 0.89, "learning_rate": 0.0001669488227281572, "loss": 0.0133, "step": 82050 }, { "epoch": 0.89, "learning_rate": 0.0001669326068625543, "loss": 0.0125, "step": 82060 }, { "epoch": 0.89, "learning_rate": 0.00016691639099695142, "loss": 0.0139, "step": 82070 }, { "epoch": 0.89, "learning_rate": 0.00016690017513134851, "loss": 0.0143, "step": 82080 }, { "epoch": 0.89, "learning_rate": 0.00016688395926574558, "loss": 0.0156, "step": 82090 }, { "epoch": 0.89, "learning_rate": 0.00016686774340014267, "loss": 0.0113, "step": 82100 }, { "epoch": 0.89, "learning_rate": 0.0001668515275345398, "loss": 0.0132, "step": 82110 }, { "epoch": 0.89, "learning_rate": 0.00016683531166893689, "loss": 0.013, "step": 82120 }, { "epoch": 0.89, "learning_rate": 0.00016681909580333395, "loss": 0.0157, "step": 82130 }, { "epoch": 0.89, "learning_rate": 0.00016680287993773107, "loss": 0.0108, "step": 82140 }, { "epoch": 0.89, "learning_rate": 0.00016678666407212816, "loss": 0.0118, "step": 82150 }, { "epoch": 0.89, "learning_rate": 0.00016677044820652526, "loss": 0.0152, "step": 82160 }, { "epoch": 0.89, "learning_rate": 0.00016675423234092232, "loss": 0.0161, "step": 82170 }, { "epoch": 0.89, "learning_rate": 0.00016673801647531944, "loss": 0.0125, "step": 82180 }, { "epoch": 0.89, "learning_rate": 0.00016672180060971653, "loss": 0.0135, "step": 82190 }, { "epoch": 0.89, "learning_rate": 0.00016670558474411363, "loss": 0.0138, "step": 82200 }, { "epoch": 0.89, "learning_rate": 0.00016668936887851072, "loss": 0.0109, "step": 82210 }, { "epoch": 0.89, "learning_rate": 0.0001666731530129078, "loss": 0.0119, "step": 82220 }, { "epoch": 0.89, "learning_rate": 0.0001666569371473049, "loss": 0.0122, "step": 82230 }, { "epoch": 0.89, "learning_rate": 0.00016664072128170203, "loss": 0.0133, "step": 82240 }, { "epoch": 0.89, "learning_rate": 0.0001666245054160991, "loss": 0.014, "step": 82250 }, { "epoch": 0.89, "learning_rate": 0.00016660828955049618, "loss": 0.0136, "step": 82260 }, { "epoch": 0.89, "learning_rate": 0.00016659207368489328, "loss": 0.012, "step": 82270 }, { "epoch": 0.89, "learning_rate": 0.0001665758578192904, "loss": 0.0129, "step": 82280 }, { "epoch": 0.89, "learning_rate": 0.00016655964195368746, "loss": 0.0156, "step": 82290 }, { "epoch": 0.89, "learning_rate": 0.00016654342608808456, "loss": 0.0141, "step": 82300 }, { "epoch": 0.89, "learning_rate": 0.00016652721022248167, "loss": 0.0141, "step": 82310 }, { "epoch": 0.89, "learning_rate": 0.00016651099435687877, "loss": 0.0138, "step": 82320 }, { "epoch": 0.89, "learning_rate": 0.00016649477849127583, "loss": 0.0137, "step": 82330 }, { "epoch": 0.89, "learning_rate": 0.00016647856262567295, "loss": 0.0156, "step": 82340 }, { "epoch": 0.89, "learning_rate": 0.00016646234676007005, "loss": 0.0129, "step": 82350 }, { "epoch": 0.89, "learning_rate": 0.00016644613089446714, "loss": 0.0145, "step": 82360 }, { "epoch": 0.89, "learning_rate": 0.0001664299150288642, "loss": 0.0155, "step": 82370 }, { "epoch": 0.89, "learning_rate": 0.00016641369916326132, "loss": 0.0158, "step": 82380 }, { "epoch": 0.89, "learning_rate": 0.00016639748329765842, "loss": 0.0153, "step": 82390 }, { "epoch": 0.89, "learning_rate": 0.0001663812674320555, "loss": 0.0144, "step": 82400 }, { "epoch": 0.89, "learning_rate": 0.0001663650515664526, "loss": 0.0172, "step": 82410 }, { "epoch": 0.89, "learning_rate": 0.0001663488357008497, "loss": 0.0111, "step": 82420 }, { "epoch": 0.89, "learning_rate": 0.0001663326198352468, "loss": 0.0123, "step": 82430 }, { "epoch": 0.89, "learning_rate": 0.0001663164039696439, "loss": 0.0122, "step": 82440 }, { "epoch": 0.89, "learning_rate": 0.00016630018810404097, "loss": 0.0148, "step": 82450 }, { "epoch": 0.89, "learning_rate": 0.00016628397223843807, "loss": 0.0127, "step": 82460 }, { "epoch": 0.89, "learning_rate": 0.00016626775637283516, "loss": 0.0134, "step": 82470 }, { "epoch": 0.89, "learning_rate": 0.00016625154050723228, "loss": 0.0139, "step": 82480 }, { "epoch": 0.89, "learning_rate": 0.00016623532464162934, "loss": 0.0112, "step": 82490 }, { "epoch": 0.89, "learning_rate": 0.00016621910877602644, "loss": 0.0132, "step": 82500 }, { "epoch": 0.89, "learning_rate": 0.00016620289291042356, "loss": 0.0122, "step": 82510 }, { "epoch": 0.89, "learning_rate": 0.00016618667704482065, "loss": 0.0158, "step": 82520 }, { "epoch": 0.89, "learning_rate": 0.00016617046117921772, "loss": 0.0165, "step": 82530 }, { "epoch": 0.89, "learning_rate": 0.0001661542453136148, "loss": 0.0122, "step": 82540 }, { "epoch": 0.89, "learning_rate": 0.00016613802944801193, "loss": 0.0115, "step": 82550 }, { "epoch": 0.89, "learning_rate": 0.00016612181358240902, "loss": 0.0146, "step": 82560 }, { "epoch": 0.89, "learning_rate": 0.00016610559771680609, "loss": 0.013, "step": 82570 }, { "epoch": 0.89, "learning_rate": 0.0001660893818512032, "loss": 0.0147, "step": 82580 }, { "epoch": 0.89, "learning_rate": 0.0001660731659856003, "loss": 0.0124, "step": 82590 }, { "epoch": 0.89, "learning_rate": 0.0001660569501199974, "loss": 0.0139, "step": 82600 }, { "epoch": 0.89, "learning_rate": 0.00016604073425439446, "loss": 0.0153, "step": 82610 }, { "epoch": 0.89, "learning_rate": 0.00016602451838879158, "loss": 0.0185, "step": 82620 }, { "epoch": 0.89, "learning_rate": 0.00016600830252318867, "loss": 0.0131, "step": 82630 }, { "epoch": 0.89, "learning_rate": 0.0001659920866575858, "loss": 0.0135, "step": 82640 }, { "epoch": 0.89, "learning_rate": 0.00016597587079198286, "loss": 0.0139, "step": 82650 }, { "epoch": 0.89, "learning_rate": 0.00016595965492637995, "loss": 0.0123, "step": 82660 }, { "epoch": 0.89, "learning_rate": 0.00016594343906077704, "loss": 0.0134, "step": 82670 }, { "epoch": 0.89, "learning_rate": 0.00016592722319517416, "loss": 0.012, "step": 82680 }, { "epoch": 0.89, "learning_rate": 0.00016591100732957123, "loss": 0.0169, "step": 82690 }, { "epoch": 0.89, "learning_rate": 0.00016589479146396832, "loss": 0.0134, "step": 82700 }, { "epoch": 0.89, "learning_rate": 0.00016587857559836544, "loss": 0.0124, "step": 82710 }, { "epoch": 0.89, "learning_rate": 0.00016586235973276253, "loss": 0.0115, "step": 82720 }, { "epoch": 0.89, "learning_rate": 0.00016584614386715962, "loss": 0.0134, "step": 82730 }, { "epoch": 0.89, "learning_rate": 0.0001658299280015567, "loss": 0.0105, "step": 82740 }, { "epoch": 0.89, "learning_rate": 0.0001658137121359538, "loss": 0.0115, "step": 82750 }, { "epoch": 0.89, "learning_rate": 0.0001657974962703509, "loss": 0.0135, "step": 82760 }, { "epoch": 0.89, "learning_rate": 0.000165781280404748, "loss": 0.0135, "step": 82770 }, { "epoch": 0.89, "learning_rate": 0.0001657650645391451, "loss": 0.0147, "step": 82780 }, { "epoch": 0.9, "learning_rate": 0.00016574884867354218, "loss": 0.0161, "step": 82790 }, { "epoch": 0.9, "learning_rate": 0.00016573263280793927, "loss": 0.0132, "step": 82800 }, { "epoch": 0.9, "learning_rate": 0.0001657164169423364, "loss": 0.0126, "step": 82810 }, { "epoch": 0.9, "learning_rate": 0.00016570020107673346, "loss": 0.0137, "step": 82820 }, { "epoch": 0.9, "learning_rate": 0.00016568398521113055, "loss": 0.0119, "step": 82830 }, { "epoch": 0.9, "learning_rate": 0.00016566776934552764, "loss": 0.0103, "step": 82840 }, { "epoch": 0.9, "learning_rate": 0.00016565155347992476, "loss": 0.0124, "step": 82850 }, { "epoch": 0.9, "learning_rate": 0.00016563533761432183, "loss": 0.0154, "step": 82860 }, { "epoch": 0.9, "learning_rate": 0.00016561912174871892, "loss": 0.0129, "step": 82870 }, { "epoch": 0.9, "learning_rate": 0.00016560290588311604, "loss": 0.0134, "step": 82880 }, { "epoch": 0.9, "learning_rate": 0.00016558669001751314, "loss": 0.0145, "step": 82890 }, { "epoch": 0.9, "learning_rate": 0.0001655704741519102, "loss": 0.0138, "step": 82900 }, { "epoch": 0.9, "learning_rate": 0.0001655542582863073, "loss": 0.0159, "step": 82910 }, { "epoch": 0.9, "learning_rate": 0.00016553804242070441, "loss": 0.0153, "step": 82920 }, { "epoch": 0.9, "learning_rate": 0.0001655218265551015, "loss": 0.0162, "step": 82930 }, { "epoch": 0.9, "learning_rate": 0.00016550561068949857, "loss": 0.014, "step": 82940 }, { "epoch": 0.9, "learning_rate": 0.0001654893948238957, "loss": 0.0157, "step": 82950 }, { "epoch": 0.9, "learning_rate": 0.00016547317895829278, "loss": 0.0148, "step": 82960 }, { "epoch": 0.9, "learning_rate": 0.00016545696309268988, "loss": 0.0125, "step": 82970 }, { "epoch": 0.9, "learning_rate": 0.00016544074722708694, "loss": 0.0152, "step": 82980 }, { "epoch": 0.9, "learning_rate": 0.00016542453136148406, "loss": 0.0164, "step": 82990 }, { "epoch": 0.9, "learning_rate": 0.00016540831549588116, "loss": 0.0129, "step": 83000 }, { "epoch": 0.9, "eval_cer": 0.9215286717149871, "eval_loss": 0.00943547859787941, "eval_runtime": 121.1193, "eval_samples_per_second": 16.513, "eval_steps_per_second": 4.128, "step": 83000 }, { "epoch": 0.9, "learning_rate": 0.00016539209963027828, "loss": 0.0115, "step": 83010 }, { "epoch": 0.9, "learning_rate": 0.00016537588376467534, "loss": 0.0143, "step": 83020 }, { "epoch": 0.9, "learning_rate": 0.00016535966789907243, "loss": 0.0138, "step": 83030 }, { "epoch": 0.9, "learning_rate": 0.00016534345203346953, "loss": 0.0113, "step": 83040 }, { "epoch": 0.9, "learning_rate": 0.00016532723616786665, "loss": 0.011, "step": 83050 }, { "epoch": 0.9, "learning_rate": 0.0001653110203022637, "loss": 0.0095, "step": 83060 }, { "epoch": 0.9, "learning_rate": 0.0001652948044366608, "loss": 0.0114, "step": 83070 }, { "epoch": 0.9, "learning_rate": 0.00016527858857105792, "loss": 0.0138, "step": 83080 }, { "epoch": 0.9, "learning_rate": 0.00016526237270545502, "loss": 0.0116, "step": 83090 }, { "epoch": 0.9, "learning_rate": 0.00016524615683985208, "loss": 0.0136, "step": 83100 }, { "epoch": 0.9, "learning_rate": 0.00016522994097424918, "loss": 0.0137, "step": 83110 }, { "epoch": 0.9, "learning_rate": 0.0001652137251086463, "loss": 0.0101, "step": 83120 }, { "epoch": 0.9, "learning_rate": 0.0001651975092430434, "loss": 0.0125, "step": 83130 }, { "epoch": 0.9, "learning_rate": 0.00016518129337744045, "loss": 0.0116, "step": 83140 }, { "epoch": 0.9, "learning_rate": 0.00016516507751183757, "loss": 0.0133, "step": 83150 }, { "epoch": 0.9, "learning_rate": 0.00016514886164623467, "loss": 0.0102, "step": 83160 }, { "epoch": 0.9, "learning_rate": 0.00016513264578063176, "loss": 0.0135, "step": 83170 }, { "epoch": 0.9, "learning_rate": 0.00016511642991502882, "loss": 0.0153, "step": 83180 }, { "epoch": 0.9, "learning_rate": 0.00016510021404942594, "loss": 0.013, "step": 83190 }, { "epoch": 0.9, "learning_rate": 0.00016508399818382304, "loss": 0.013, "step": 83200 }, { "epoch": 0.9, "learning_rate": 0.00016506778231822013, "loss": 0.0151, "step": 83210 }, { "epoch": 0.9, "learning_rate": 0.00016505156645261722, "loss": 0.0149, "step": 83220 }, { "epoch": 0.9, "learning_rate": 0.00016503535058701432, "loss": 0.0107, "step": 83230 }, { "epoch": 0.9, "learning_rate": 0.0001650191347214114, "loss": 0.0115, "step": 83240 }, { "epoch": 0.9, "learning_rate": 0.00016500291885580853, "loss": 0.0135, "step": 83250 }, { "epoch": 0.9, "learning_rate": 0.0001649867029902056, "loss": 0.013, "step": 83260 }, { "epoch": 0.9, "learning_rate": 0.0001649704871246027, "loss": 0.0128, "step": 83270 }, { "epoch": 0.9, "learning_rate": 0.00016495427125899978, "loss": 0.0136, "step": 83280 }, { "epoch": 0.9, "learning_rate": 0.0001649380553933969, "loss": 0.0136, "step": 83290 }, { "epoch": 0.9, "learning_rate": 0.00016492183952779396, "loss": 0.015, "step": 83300 }, { "epoch": 0.9, "learning_rate": 0.00016490562366219106, "loss": 0.0123, "step": 83310 }, { "epoch": 0.9, "learning_rate": 0.00016488940779658818, "loss": 0.0134, "step": 83320 }, { "epoch": 0.9, "learning_rate": 0.00016487319193098527, "loss": 0.013, "step": 83330 }, { "epoch": 0.9, "learning_rate": 0.00016485697606538234, "loss": 0.0149, "step": 83340 }, { "epoch": 0.9, "learning_rate": 0.00016484076019977946, "loss": 0.0104, "step": 83350 }, { "epoch": 0.9, "learning_rate": 0.00016482454433417655, "loss": 0.0131, "step": 83360 }, { "epoch": 0.9, "learning_rate": 0.00016480832846857364, "loss": 0.0134, "step": 83370 }, { "epoch": 0.9, "learning_rate": 0.0001647921126029707, "loss": 0.0124, "step": 83380 }, { "epoch": 0.9, "learning_rate": 0.00016477589673736783, "loss": 0.0156, "step": 83390 }, { "epoch": 0.9, "learning_rate": 0.00016475968087176492, "loss": 0.0135, "step": 83400 }, { "epoch": 0.9, "learning_rate": 0.000164743465006162, "loss": 0.0127, "step": 83410 }, { "epoch": 0.9, "learning_rate": 0.0001647272491405591, "loss": 0.0099, "step": 83420 }, { "epoch": 0.9, "learning_rate": 0.0001647110332749562, "loss": 0.0143, "step": 83430 }, { "epoch": 0.9, "learning_rate": 0.0001646948174093533, "loss": 0.0131, "step": 83440 }, { "epoch": 0.9, "learning_rate": 0.0001646786015437504, "loss": 0.0124, "step": 83450 }, { "epoch": 0.9, "learning_rate": 0.0001646623856781475, "loss": 0.0136, "step": 83460 }, { "epoch": 0.9, "learning_rate": 0.00016464616981254457, "loss": 0.0106, "step": 83470 }, { "epoch": 0.9, "learning_rate": 0.00016462995394694166, "loss": 0.0146, "step": 83480 }, { "epoch": 0.9, "learning_rate": 0.00016461373808133878, "loss": 0.0152, "step": 83490 }, { "epoch": 0.9, "learning_rate": 0.00016459752221573587, "loss": 0.0165, "step": 83500 }, { "epoch": 0.9, "learning_rate": 0.00016458130635013294, "loss": 0.0151, "step": 83510 }, { "epoch": 0.9, "learning_rate": 0.00016456509048453006, "loss": 0.0157, "step": 83520 }, { "epoch": 0.9, "learning_rate": 0.00016454887461892715, "loss": 0.0124, "step": 83530 }, { "epoch": 0.9, "learning_rate": 0.00016453265875332425, "loss": 0.0122, "step": 83540 }, { "epoch": 0.9, "learning_rate": 0.0001645164428877213, "loss": 0.0127, "step": 83550 }, { "epoch": 0.9, "learning_rate": 0.00016450022702211843, "loss": 0.0136, "step": 83560 }, { "epoch": 0.9, "learning_rate": 0.00016448401115651552, "loss": 0.0138, "step": 83570 }, { "epoch": 0.9, "learning_rate": 0.00016446779529091262, "loss": 0.0126, "step": 83580 }, { "epoch": 0.9, "learning_rate": 0.0001644515794253097, "loss": 0.0124, "step": 83590 }, { "epoch": 0.9, "learning_rate": 0.0001644353635597068, "loss": 0.0121, "step": 83600 }, { "epoch": 0.9, "learning_rate": 0.0001644191476941039, "loss": 0.0126, "step": 83610 }, { "epoch": 0.9, "learning_rate": 0.00016440293182850101, "loss": 0.014, "step": 83620 }, { "epoch": 0.9, "learning_rate": 0.00016438671596289808, "loss": 0.0134, "step": 83630 }, { "epoch": 0.9, "learning_rate": 0.00016437050009729517, "loss": 0.0177, "step": 83640 }, { "epoch": 0.9, "learning_rate": 0.0001643542842316923, "loss": 0.0172, "step": 83650 }, { "epoch": 0.9, "learning_rate": 0.00016433806836608939, "loss": 0.0127, "step": 83660 }, { "epoch": 0.9, "learning_rate": 0.00016432185250048645, "loss": 0.0115, "step": 83670 }, { "epoch": 0.9, "learning_rate": 0.00016430563663488354, "loss": 0.0129, "step": 83680 }, { "epoch": 0.9, "learning_rate": 0.00016428942076928066, "loss": 0.0153, "step": 83690 }, { "epoch": 0.9, "learning_rate": 0.00016427320490367776, "loss": 0.0156, "step": 83700 }, { "epoch": 0.9, "learning_rate": 0.00016425698903807482, "loss": 0.0117, "step": 83710 }, { "epoch": 0.91, "learning_rate": 0.00016424077317247194, "loss": 0.0128, "step": 83720 }, { "epoch": 0.91, "learning_rate": 0.00016422455730686903, "loss": 0.0163, "step": 83730 }, { "epoch": 0.91, "learning_rate": 0.00016420834144126613, "loss": 0.0128, "step": 83740 }, { "epoch": 0.91, "learning_rate": 0.0001641921255756632, "loss": 0.0117, "step": 83750 }, { "epoch": 0.91, "learning_rate": 0.0001641759097100603, "loss": 0.0128, "step": 83760 }, { "epoch": 0.91, "learning_rate": 0.0001641596938444574, "loss": 0.0121, "step": 83770 }, { "epoch": 0.91, "learning_rate": 0.0001641434779788545, "loss": 0.0113, "step": 83780 }, { "epoch": 0.91, "learning_rate": 0.0001641272621132516, "loss": 0.0137, "step": 83790 }, { "epoch": 0.91, "learning_rate": 0.00016411104624764868, "loss": 0.0178, "step": 83800 }, { "epoch": 0.91, "learning_rate": 0.00016409483038204578, "loss": 0.0135, "step": 83810 }, { "epoch": 0.91, "learning_rate": 0.0001640786145164429, "loss": 0.0183, "step": 83820 }, { "epoch": 0.91, "learning_rate": 0.00016406239865083996, "loss": 0.0118, "step": 83830 }, { "epoch": 0.91, "learning_rate": 0.00016404618278523705, "loss": 0.0123, "step": 83840 }, { "epoch": 0.91, "learning_rate": 0.00016402996691963415, "loss": 0.0147, "step": 83850 }, { "epoch": 0.91, "learning_rate": 0.00016401375105403127, "loss": 0.0147, "step": 83860 }, { "epoch": 0.91, "learning_rate": 0.00016399753518842833, "loss": 0.0113, "step": 83870 }, { "epoch": 0.91, "learning_rate": 0.00016398131932282543, "loss": 0.0143, "step": 83880 }, { "epoch": 0.91, "learning_rate": 0.00016396510345722255, "loss": 0.0132, "step": 83890 }, { "epoch": 0.91, "learning_rate": 0.00016394888759161964, "loss": 0.0125, "step": 83900 }, { "epoch": 0.91, "learning_rate": 0.0001639326717260167, "loss": 0.0136, "step": 83910 }, { "epoch": 0.91, "learning_rate": 0.0001639164558604138, "loss": 0.0164, "step": 83920 }, { "epoch": 0.91, "learning_rate": 0.00016390023999481092, "loss": 0.0114, "step": 83930 }, { "epoch": 0.91, "learning_rate": 0.000163884024129208, "loss": 0.0126, "step": 83940 }, { "epoch": 0.91, "learning_rate": 0.00016386780826360507, "loss": 0.0171, "step": 83950 }, { "epoch": 0.91, "learning_rate": 0.0001638515923980022, "loss": 0.0098, "step": 83960 }, { "epoch": 0.91, "learning_rate": 0.0001638353765323993, "loss": 0.0137, "step": 83970 }, { "epoch": 0.91, "learning_rate": 0.00016381916066679638, "loss": 0.0134, "step": 83980 }, { "epoch": 0.91, "learning_rate": 0.00016380294480119345, "loss": 0.0156, "step": 83990 }, { "epoch": 0.91, "learning_rate": 0.00016378672893559057, "loss": 0.0125, "step": 84000 }, { "epoch": 0.91, "eval_cer": 0.9215373577445508, "eval_loss": 0.009720318019390106, "eval_runtime": 121.0619, "eval_samples_per_second": 16.52, "eval_steps_per_second": 4.13, "step": 84000 }, { "epoch": 0.91, "learning_rate": 0.00016377051306998766, "loss": 0.0153, "step": 84010 }, { "epoch": 0.91, "learning_rate": 0.00016375429720438478, "loss": 0.0099, "step": 84020 }, { "epoch": 0.91, "learning_rate": 0.00016373808133878184, "loss": 0.0113, "step": 84030 }, { "epoch": 0.91, "learning_rate": 0.00016372186547317894, "loss": 0.0132, "step": 84040 }, { "epoch": 0.91, "learning_rate": 0.00016370564960757603, "loss": 0.0151, "step": 84050 }, { "epoch": 0.91, "learning_rate": 0.00016368943374197315, "loss": 0.0133, "step": 84060 }, { "epoch": 0.91, "learning_rate": 0.00016367321787637021, "loss": 0.0131, "step": 84070 }, { "epoch": 0.91, "learning_rate": 0.0001636570020107673, "loss": 0.0113, "step": 84080 }, { "epoch": 0.91, "learning_rate": 0.00016364078614516443, "loss": 0.0127, "step": 84090 }, { "epoch": 0.91, "learning_rate": 0.00016362457027956152, "loss": 0.0146, "step": 84100 }, { "epoch": 0.91, "learning_rate": 0.00016360835441395859, "loss": 0.0146, "step": 84110 }, { "epoch": 0.91, "learning_rate": 0.00016359213854835568, "loss": 0.0148, "step": 84120 }, { "epoch": 0.91, "learning_rate": 0.0001635759226827528, "loss": 0.0134, "step": 84130 }, { "epoch": 0.91, "learning_rate": 0.0001635597068171499, "loss": 0.0131, "step": 84140 }, { "epoch": 0.91, "learning_rate": 0.00016354349095154696, "loss": 0.0117, "step": 84150 }, { "epoch": 0.91, "learning_rate": 0.00016352727508594408, "loss": 0.0134, "step": 84160 }, { "epoch": 0.91, "learning_rate": 0.00016351105922034117, "loss": 0.0125, "step": 84170 }, { "epoch": 0.91, "learning_rate": 0.00016349484335473826, "loss": 0.0141, "step": 84180 }, { "epoch": 0.91, "learning_rate": 0.00016347862748913538, "loss": 0.0155, "step": 84190 }, { "epoch": 0.91, "learning_rate": 0.00016346241162353245, "loss": 0.0107, "step": 84200 }, { "epoch": 0.91, "learning_rate": 0.00016344619575792954, "loss": 0.015, "step": 84210 }, { "epoch": 0.91, "learning_rate": 0.00016342997989232663, "loss": 0.0118, "step": 84220 }, { "epoch": 0.91, "learning_rate": 0.00016341376402672375, "loss": 0.0131, "step": 84230 }, { "epoch": 0.91, "learning_rate": 0.00016339754816112082, "loss": 0.0137, "step": 84240 }, { "epoch": 0.91, "learning_rate": 0.0001633813322955179, "loss": 0.0129, "step": 84250 }, { "epoch": 0.91, "learning_rate": 0.00016336511642991503, "loss": 0.0113, "step": 84260 }, { "epoch": 0.91, "learning_rate": 0.00016334890056431212, "loss": 0.0114, "step": 84270 }, { "epoch": 0.91, "learning_rate": 0.0001633326846987092, "loss": 0.0121, "step": 84280 }, { "epoch": 0.91, "learning_rate": 0.00016331646883310628, "loss": 0.0102, "step": 84290 }, { "epoch": 0.91, "learning_rate": 0.0001633002529675034, "loss": 0.0107, "step": 84300 }, { "epoch": 0.91, "learning_rate": 0.0001632840371019005, "loss": 0.012, "step": 84310 }, { "epoch": 0.91, "learning_rate": 0.00016326782123629756, "loss": 0.012, "step": 84320 }, { "epoch": 0.91, "learning_rate": 0.00016325160537069468, "loss": 0.0126, "step": 84330 }, { "epoch": 0.91, "learning_rate": 0.00016323538950509177, "loss": 0.0118, "step": 84340 }, { "epoch": 0.91, "learning_rate": 0.00016321917363948887, "loss": 0.0114, "step": 84350 }, { "epoch": 0.91, "learning_rate": 0.00016320295777388596, "loss": 0.0101, "step": 84360 }, { "epoch": 0.91, "learning_rate": 0.00016318674190828305, "loss": 0.0134, "step": 84370 }, { "epoch": 0.91, "learning_rate": 0.00016317052604268014, "loss": 0.0099, "step": 84380 }, { "epoch": 0.91, "learning_rate": 0.00016315431017707726, "loss": 0.0137, "step": 84390 }, { "epoch": 0.91, "learning_rate": 0.00016313809431147433, "loss": 0.0144, "step": 84400 }, { "epoch": 0.91, "learning_rate": 0.00016312187844587142, "loss": 0.0135, "step": 84410 }, { "epoch": 0.91, "learning_rate": 0.00016310566258026851, "loss": 0.0108, "step": 84420 }, { "epoch": 0.91, "learning_rate": 0.00016308944671466563, "loss": 0.0115, "step": 84430 }, { "epoch": 0.91, "learning_rate": 0.0001630732308490627, "loss": 0.0107, "step": 84440 }, { "epoch": 0.91, "learning_rate": 0.0001630570149834598, "loss": 0.0119, "step": 84450 }, { "epoch": 0.91, "learning_rate": 0.0001630407991178569, "loss": 0.0116, "step": 84460 }, { "epoch": 0.91, "learning_rate": 0.000163024583252254, "loss": 0.0117, "step": 84470 }, { "epoch": 0.91, "learning_rate": 0.00016300836738665107, "loss": 0.0146, "step": 84480 }, { "epoch": 0.91, "learning_rate": 0.00016299215152104816, "loss": 0.0113, "step": 84490 }, { "epoch": 0.91, "learning_rate": 0.00016297593565544528, "loss": 0.0125, "step": 84500 }, { "epoch": 0.91, "learning_rate": 0.00016295971978984238, "loss": 0.0126, "step": 84510 }, { "epoch": 0.91, "learning_rate": 0.00016294350392423944, "loss": 0.0132, "step": 84520 }, { "epoch": 0.91, "learning_rate": 0.00016292728805863656, "loss": 0.0111, "step": 84530 }, { "epoch": 0.91, "learning_rate": 0.00016291107219303365, "loss": 0.0151, "step": 84540 }, { "epoch": 0.91, "learning_rate": 0.00016289485632743075, "loss": 0.0128, "step": 84550 }, { "epoch": 0.91, "learning_rate": 0.0001628786404618278, "loss": 0.0141, "step": 84560 }, { "epoch": 0.91, "learning_rate": 0.00016286242459622493, "loss": 0.0117, "step": 84570 }, { "epoch": 0.91, "learning_rate": 0.00016284620873062203, "loss": 0.0183, "step": 84580 }, { "epoch": 0.91, "learning_rate": 0.00016282999286501912, "loss": 0.0167, "step": 84590 }, { "epoch": 0.91, "learning_rate": 0.0001628137769994162, "loss": 0.0134, "step": 84600 }, { "epoch": 0.91, "learning_rate": 0.0001627975611338133, "loss": 0.0132, "step": 84610 }, { "epoch": 0.91, "learning_rate": 0.0001627813452682104, "loss": 0.0127, "step": 84620 }, { "epoch": 0.91, "learning_rate": 0.00016276512940260752, "loss": 0.0134, "step": 84630 }, { "epoch": 0.92, "learning_rate": 0.00016274891353700458, "loss": 0.0115, "step": 84640 }, { "epoch": 0.92, "learning_rate": 0.00016273269767140168, "loss": 0.0116, "step": 84650 }, { "epoch": 0.92, "learning_rate": 0.0001627164818057988, "loss": 0.0142, "step": 84660 }, { "epoch": 0.92, "learning_rate": 0.0001627002659401959, "loss": 0.0099, "step": 84670 }, { "epoch": 0.92, "learning_rate": 0.00016268405007459295, "loss": 0.0153, "step": 84680 }, { "epoch": 0.92, "learning_rate": 0.00016266783420899005, "loss": 0.0107, "step": 84690 }, { "epoch": 0.92, "learning_rate": 0.00016265161834338717, "loss": 0.0126, "step": 84700 }, { "epoch": 0.92, "learning_rate": 0.00016263540247778426, "loss": 0.015, "step": 84710 }, { "epoch": 0.92, "learning_rate": 0.00016261918661218132, "loss": 0.0129, "step": 84720 }, { "epoch": 0.92, "learning_rate": 0.00016260297074657844, "loss": 0.0143, "step": 84730 }, { "epoch": 0.92, "learning_rate": 0.00016258675488097554, "loss": 0.014, "step": 84740 }, { "epoch": 0.92, "learning_rate": 0.00016257053901537263, "loss": 0.011, "step": 84750 }, { "epoch": 0.92, "learning_rate": 0.0001625543231497697, "loss": 0.0159, "step": 84760 }, { "epoch": 0.92, "learning_rate": 0.00016253810728416682, "loss": 0.0104, "step": 84770 }, { "epoch": 0.92, "learning_rate": 0.0001625218914185639, "loss": 0.0118, "step": 84780 }, { "epoch": 0.92, "learning_rate": 0.000162505675552961, "loss": 0.0111, "step": 84790 }, { "epoch": 0.92, "learning_rate": 0.0001624894596873581, "loss": 0.0122, "step": 84800 }, { "epoch": 0.92, "learning_rate": 0.00016247324382175519, "loss": 0.0124, "step": 84810 }, { "epoch": 0.92, "learning_rate": 0.00016245702795615228, "loss": 0.0114, "step": 84820 }, { "epoch": 0.92, "learning_rate": 0.0001624408120905494, "loss": 0.0109, "step": 84830 }, { "epoch": 0.92, "learning_rate": 0.00016242459622494646, "loss": 0.011, "step": 84840 }, { "epoch": 0.92, "learning_rate": 0.00016240838035934356, "loss": 0.0155, "step": 84850 }, { "epoch": 0.92, "learning_rate": 0.00016239216449374065, "loss": 0.0159, "step": 84860 }, { "epoch": 0.92, "learning_rate": 0.00016237594862813777, "loss": 0.0107, "step": 84870 }, { "epoch": 0.92, "learning_rate": 0.00016235973276253486, "loss": 0.0111, "step": 84880 }, { "epoch": 0.92, "learning_rate": 0.00016234351689693193, "loss": 0.0122, "step": 84890 }, { "epoch": 0.92, "learning_rate": 0.00016232730103132905, "loss": 0.0123, "step": 84900 }, { "epoch": 0.92, "learning_rate": 0.00016231108516572614, "loss": 0.0139, "step": 84910 }, { "epoch": 0.92, "learning_rate": 0.00016229486930012323, "loss": 0.0136, "step": 84920 }, { "epoch": 0.92, "learning_rate": 0.0001622786534345203, "loss": 0.0127, "step": 84930 }, { "epoch": 0.92, "learning_rate": 0.00016226243756891742, "loss": 0.015, "step": 84940 }, { "epoch": 0.92, "learning_rate": 0.0001622462217033145, "loss": 0.0115, "step": 84950 }, { "epoch": 0.92, "learning_rate": 0.00016223000583771163, "loss": 0.0113, "step": 84960 }, { "epoch": 0.92, "learning_rate": 0.0001622137899721087, "loss": 0.017, "step": 84970 }, { "epoch": 0.92, "learning_rate": 0.0001621975741065058, "loss": 0.0132, "step": 84980 }, { "epoch": 0.92, "learning_rate": 0.00016218135824090288, "loss": 0.014, "step": 84990 }, { "epoch": 0.92, "learning_rate": 0.0001621651423753, "loss": 0.0147, "step": 85000 }, { "epoch": 0.92, "eval_cer": 0.9215269345090743, "eval_loss": 0.00925032515078783, "eval_runtime": 121.1422, "eval_samples_per_second": 16.51, "eval_steps_per_second": 4.127, "step": 85000 }, { "epoch": 0.92, "learning_rate": 0.00016214892650969707, "loss": 0.013, "step": 85010 }, { "epoch": 0.92, "learning_rate": 0.00016213271064409416, "loss": 0.0114, "step": 85020 }, { "epoch": 0.92, "learning_rate": 0.00016211649477849128, "loss": 0.0136, "step": 85030 }, { "epoch": 0.92, "learning_rate": 0.00016210027891288837, "loss": 0.0139, "step": 85040 }, { "epoch": 0.92, "learning_rate": 0.00016208406304728544, "loss": 0.0082, "step": 85050 }, { "epoch": 0.92, "learning_rate": 0.00016206784718168253, "loss": 0.0157, "step": 85060 }, { "epoch": 0.92, "learning_rate": 0.00016205163131607965, "loss": 0.0154, "step": 85070 }, { "epoch": 0.92, "learning_rate": 0.00016203541545047674, "loss": 0.0121, "step": 85080 }, { "epoch": 0.92, "learning_rate": 0.0001620191995848738, "loss": 0.0144, "step": 85090 }, { "epoch": 0.92, "learning_rate": 0.00016200298371927093, "loss": 0.0145, "step": 85100 }, { "epoch": 0.92, "learning_rate": 0.00016198676785366802, "loss": 0.0139, "step": 85110 }, { "epoch": 0.92, "learning_rate": 0.00016197055198806512, "loss": 0.0146, "step": 85120 }, { "epoch": 0.92, "learning_rate": 0.00016195433612246218, "loss": 0.0137, "step": 85130 }, { "epoch": 0.92, "learning_rate": 0.0001619381202568593, "loss": 0.0125, "step": 85140 }, { "epoch": 0.92, "learning_rate": 0.0001619219043912564, "loss": 0.0102, "step": 85150 }, { "epoch": 0.92, "learning_rate": 0.00016190568852565349, "loss": 0.0107, "step": 85160 }, { "epoch": 0.92, "learning_rate": 0.00016188947266005058, "loss": 0.013, "step": 85170 }, { "epoch": 0.92, "learning_rate": 0.00016187325679444767, "loss": 0.0133, "step": 85180 }, { "epoch": 0.92, "learning_rate": 0.00016185704092884476, "loss": 0.0154, "step": 85190 }, { "epoch": 0.92, "learning_rate": 0.00016184082506324188, "loss": 0.0229, "step": 85200 }, { "epoch": 0.92, "learning_rate": 0.00016182460919763895, "loss": 0.012, "step": 85210 }, { "epoch": 0.92, "learning_rate": 0.00016180839333203604, "loss": 0.0111, "step": 85220 }, { "epoch": 0.92, "learning_rate": 0.00016179217746643314, "loss": 0.0114, "step": 85230 }, { "epoch": 0.92, "learning_rate": 0.00016177596160083026, "loss": 0.0127, "step": 85240 }, { "epoch": 0.92, "learning_rate": 0.00016175974573522732, "loss": 0.0139, "step": 85250 }, { "epoch": 0.92, "learning_rate": 0.00016174352986962441, "loss": 0.0109, "step": 85260 }, { "epoch": 0.92, "learning_rate": 0.00016172731400402153, "loss": 0.012, "step": 85270 }, { "epoch": 0.92, "learning_rate": 0.00016171109813841863, "loss": 0.0118, "step": 85280 }, { "epoch": 0.92, "learning_rate": 0.0001616948822728157, "loss": 0.0141, "step": 85290 }, { "epoch": 0.92, "learning_rate": 0.00016167866640721278, "loss": 0.0098, "step": 85300 }, { "epoch": 0.92, "learning_rate": 0.0001616624505416099, "loss": 0.0122, "step": 85310 }, { "epoch": 0.92, "learning_rate": 0.000161646234676007, "loss": 0.0114, "step": 85320 }, { "epoch": 0.92, "learning_rate": 0.00016163001881040406, "loss": 0.0102, "step": 85330 }, { "epoch": 0.92, "learning_rate": 0.00016161380294480118, "loss": 0.0145, "step": 85340 }, { "epoch": 0.92, "learning_rate": 0.00016159758707919828, "loss": 0.0132, "step": 85350 }, { "epoch": 0.92, "learning_rate": 0.00016158137121359537, "loss": 0.0129, "step": 85360 }, { "epoch": 0.92, "learning_rate": 0.00016156515534799246, "loss": 0.0122, "step": 85370 }, { "epoch": 0.92, "learning_rate": 0.00016154893948238955, "loss": 0.0133, "step": 85380 }, { "epoch": 0.92, "learning_rate": 0.00016153272361678665, "loss": 0.0156, "step": 85390 }, { "epoch": 0.92, "learning_rate": 0.00016151650775118377, "loss": 0.0149, "step": 85400 }, { "epoch": 0.92, "learning_rate": 0.00016150029188558083, "loss": 0.0129, "step": 85410 }, { "epoch": 0.92, "learning_rate": 0.00016148407601997792, "loss": 0.0106, "step": 85420 }, { "epoch": 0.92, "learning_rate": 0.00016146786015437502, "loss": 0.0119, "step": 85430 }, { "epoch": 0.92, "learning_rate": 0.00016145164428877214, "loss": 0.0105, "step": 85440 }, { "epoch": 0.92, "learning_rate": 0.0001614354284231692, "loss": 0.0092, "step": 85450 }, { "epoch": 0.92, "learning_rate": 0.0001614192125575663, "loss": 0.0137, "step": 85460 }, { "epoch": 0.92, "learning_rate": 0.00016140299669196342, "loss": 0.013, "step": 85470 }, { "epoch": 0.92, "learning_rate": 0.0001613867808263605, "loss": 0.0103, "step": 85480 }, { "epoch": 0.92, "learning_rate": 0.00016137056496075757, "loss": 0.0116, "step": 85490 }, { "epoch": 0.92, "learning_rate": 0.00016135434909515467, "loss": 0.0127, "step": 85500 }, { "epoch": 0.92, "learning_rate": 0.0001613381332295518, "loss": 0.0167, "step": 85510 }, { "epoch": 0.92, "learning_rate": 0.00016132191736394888, "loss": 0.0144, "step": 85520 }, { "epoch": 0.92, "learning_rate": 0.00016130570149834594, "loss": 0.0115, "step": 85530 }, { "epoch": 0.92, "learning_rate": 0.00016128948563274306, "loss": 0.0135, "step": 85540 }, { "epoch": 0.92, "learning_rate": 0.00016127326976714016, "loss": 0.0138, "step": 85550 }, { "epoch": 0.92, "learning_rate": 0.00016125705390153725, "loss": 0.0145, "step": 85560 }, { "epoch": 0.93, "learning_rate": 0.00016124083803593432, "loss": 0.0104, "step": 85570 }, { "epoch": 0.93, "learning_rate": 0.00016122462217033144, "loss": 0.0135, "step": 85580 }, { "epoch": 0.93, "learning_rate": 0.00016120840630472853, "loss": 0.0179, "step": 85590 }, { "epoch": 0.93, "learning_rate": 0.00016119219043912562, "loss": 0.0124, "step": 85600 }, { "epoch": 0.93, "learning_rate": 0.00016117597457352274, "loss": 0.0147, "step": 85610 }, { "epoch": 0.93, "learning_rate": 0.0001611597587079198, "loss": 0.0158, "step": 85620 }, { "epoch": 0.93, "learning_rate": 0.0001611435428423169, "loss": 0.0141, "step": 85630 }, { "epoch": 0.93, "learning_rate": 0.00016112732697671402, "loss": 0.014, "step": 85640 }, { "epoch": 0.93, "learning_rate": 0.0001611111111111111, "loss": 0.0131, "step": 85650 }, { "epoch": 0.93, "learning_rate": 0.00016109489524550818, "loss": 0.0139, "step": 85660 }, { "epoch": 0.93, "learning_rate": 0.0001610786793799053, "loss": 0.015, "step": 85670 }, { "epoch": 0.93, "learning_rate": 0.0001610624635143024, "loss": 0.0118, "step": 85680 }, { "epoch": 0.93, "learning_rate": 0.00016104624764869948, "loss": 0.0137, "step": 85690 }, { "epoch": 0.93, "learning_rate": 0.00016103003178309655, "loss": 0.0107, "step": 85700 }, { "epoch": 0.93, "learning_rate": 0.00016101381591749367, "loss": 0.0177, "step": 85710 }, { "epoch": 0.93, "learning_rate": 0.00016099760005189076, "loss": 0.0153, "step": 85720 }, { "epoch": 0.93, "learning_rate": 0.00016098138418628785, "loss": 0.0118, "step": 85730 }, { "epoch": 0.93, "learning_rate": 0.00016096516832068495, "loss": 0.0136, "step": 85740 }, { "epoch": 0.93, "learning_rate": 0.00016094895245508204, "loss": 0.014, "step": 85750 }, { "epoch": 0.93, "learning_rate": 0.00016093273658947913, "loss": 0.0145, "step": 85760 }, { "epoch": 0.93, "learning_rate": 0.00016091652072387625, "loss": 0.0121, "step": 85770 }, { "epoch": 0.93, "learning_rate": 0.00016090030485827332, "loss": 0.0133, "step": 85780 }, { "epoch": 0.93, "learning_rate": 0.0001608840889926704, "loss": 0.0116, "step": 85790 }, { "epoch": 0.93, "learning_rate": 0.0001608678731270675, "loss": 0.0105, "step": 85800 }, { "epoch": 0.93, "learning_rate": 0.00016085165726146462, "loss": 0.0152, "step": 85810 }, { "epoch": 0.93, "learning_rate": 0.0001608354413958617, "loss": 0.0132, "step": 85820 }, { "epoch": 0.93, "learning_rate": 0.00016081922553025878, "loss": 0.0116, "step": 85830 }, { "epoch": 0.93, "learning_rate": 0.0001608030096646559, "loss": 0.0116, "step": 85840 }, { "epoch": 0.93, "learning_rate": 0.000160786793799053, "loss": 0.0138, "step": 85850 }, { "epoch": 0.93, "learning_rate": 0.00016077057793345006, "loss": 0.0123, "step": 85860 }, { "epoch": 0.93, "learning_rate": 0.00016075436206784715, "loss": 0.0111, "step": 85870 }, { "epoch": 0.93, "learning_rate": 0.00016073814620224427, "loss": 0.0119, "step": 85880 }, { "epoch": 0.93, "learning_rate": 0.00016072193033664137, "loss": 0.0108, "step": 85890 }, { "epoch": 0.93, "learning_rate": 0.00016070571447103843, "loss": 0.013, "step": 85900 }, { "epoch": 0.93, "learning_rate": 0.00016068949860543555, "loss": 0.0125, "step": 85910 }, { "epoch": 0.93, "learning_rate": 0.00016067328273983264, "loss": 0.0159, "step": 85920 }, { "epoch": 0.93, "learning_rate": 0.00016065706687422974, "loss": 0.0119, "step": 85930 }, { "epoch": 0.93, "learning_rate": 0.0001606408510086268, "loss": 0.0158, "step": 85940 }, { "epoch": 0.93, "learning_rate": 0.00016062463514302392, "loss": 0.0139, "step": 85950 }, { "epoch": 0.93, "learning_rate": 0.00016060841927742101, "loss": 0.0168, "step": 85960 }, { "epoch": 0.93, "learning_rate": 0.00016059220341181813, "loss": 0.016, "step": 85970 }, { "epoch": 0.93, "learning_rate": 0.0001605759875462152, "loss": 0.014, "step": 85980 }, { "epoch": 0.93, "learning_rate": 0.0001605597716806123, "loss": 0.0142, "step": 85990 }, { "epoch": 0.93, "learning_rate": 0.00016054355581500939, "loss": 0.0145, "step": 86000 }, { "epoch": 0.93, "eval_cer": 0.9215278031120306, "eval_loss": 0.009139015339314938, "eval_runtime": 121.317, "eval_samples_per_second": 16.486, "eval_steps_per_second": 4.121, "step": 86000 }, { "epoch": 0.93, "learning_rate": 0.0001605273399494065, "loss": 0.0127, "step": 86010 }, { "epoch": 0.93, "learning_rate": 0.00016051112408380357, "loss": 0.0104, "step": 86020 }, { "epoch": 0.93, "learning_rate": 0.00016049490821820066, "loss": 0.0139, "step": 86030 }, { "epoch": 0.93, "learning_rate": 0.00016047869235259778, "loss": 0.0113, "step": 86040 }, { "epoch": 0.93, "learning_rate": 0.00016046247648699488, "loss": 0.0143, "step": 86050 }, { "epoch": 0.93, "learning_rate": 0.00016044626062139194, "loss": 0.0142, "step": 86060 }, { "epoch": 0.93, "learning_rate": 0.00016043004475578903, "loss": 0.0127, "step": 86070 }, { "epoch": 0.93, "learning_rate": 0.00016041382889018615, "loss": 0.0143, "step": 86080 }, { "epoch": 0.93, "learning_rate": 0.00016039761302458325, "loss": 0.0122, "step": 86090 }, { "epoch": 0.93, "learning_rate": 0.0001603813971589803, "loss": 0.0112, "step": 86100 }, { "epoch": 0.93, "learning_rate": 0.00016036518129337743, "loss": 0.014, "step": 86110 }, { "epoch": 0.93, "learning_rate": 0.00016034896542777453, "loss": 0.0136, "step": 86120 }, { "epoch": 0.93, "learning_rate": 0.00016033274956217162, "loss": 0.0111, "step": 86130 }, { "epoch": 0.93, "learning_rate": 0.00016031653369656868, "loss": 0.012, "step": 86140 }, { "epoch": 0.93, "learning_rate": 0.0001603003178309658, "loss": 0.0103, "step": 86150 }, { "epoch": 0.93, "learning_rate": 0.0001602841019653629, "loss": 0.0142, "step": 86160 }, { "epoch": 0.93, "learning_rate": 0.00016026788609976, "loss": 0.0122, "step": 86170 }, { "epoch": 0.93, "learning_rate": 0.00016025167023415708, "loss": 0.011, "step": 86180 }, { "epoch": 0.93, "learning_rate": 0.00016023545436855417, "loss": 0.0145, "step": 86190 }, { "epoch": 0.93, "learning_rate": 0.00016021923850295127, "loss": 0.0161, "step": 86200 }, { "epoch": 0.93, "learning_rate": 0.0001602030226373484, "loss": 0.013, "step": 86210 }, { "epoch": 0.93, "learning_rate": 0.00016018680677174545, "loss": 0.0096, "step": 86220 }, { "epoch": 0.93, "learning_rate": 0.00016017059090614255, "loss": 0.0111, "step": 86230 }, { "epoch": 0.93, "learning_rate": 0.00016015437504053964, "loss": 0.0136, "step": 86240 }, { "epoch": 0.93, "learning_rate": 0.00016013815917493676, "loss": 0.0128, "step": 86250 }, { "epoch": 0.93, "learning_rate": 0.00016012194330933382, "loss": 0.0128, "step": 86260 }, { "epoch": 0.93, "learning_rate": 0.00016010572744373092, "loss": 0.0133, "step": 86270 }, { "epoch": 0.93, "learning_rate": 0.00016008951157812804, "loss": 0.0126, "step": 86280 }, { "epoch": 0.93, "learning_rate": 0.00016007329571252513, "loss": 0.0109, "step": 86290 }, { "epoch": 0.93, "learning_rate": 0.0001600570798469222, "loss": 0.0139, "step": 86300 }, { "epoch": 0.93, "learning_rate": 0.0001600408639813193, "loss": 0.0106, "step": 86310 }, { "epoch": 0.93, "learning_rate": 0.0001600246481157164, "loss": 0.0172, "step": 86320 }, { "epoch": 0.93, "learning_rate": 0.0001600084322501135, "loss": 0.013, "step": 86330 }, { "epoch": 0.93, "learning_rate": 0.00015999221638451062, "loss": 0.0139, "step": 86340 }, { "epoch": 0.93, "learning_rate": 0.00015997600051890769, "loss": 0.0144, "step": 86350 }, { "epoch": 0.93, "learning_rate": 0.00015995978465330478, "loss": 0.0162, "step": 86360 }, { "epoch": 0.93, "learning_rate": 0.00015994356878770187, "loss": 0.0126, "step": 86370 }, { "epoch": 0.93, "learning_rate": 0.000159927352922099, "loss": 0.0122, "step": 86380 }, { "epoch": 0.93, "learning_rate": 0.00015991113705649606, "loss": 0.0162, "step": 86390 }, { "epoch": 0.93, "learning_rate": 0.00015989492119089315, "loss": 0.0124, "step": 86400 }, { "epoch": 0.93, "learning_rate": 0.00015987870532529027, "loss": 0.0123, "step": 86410 }, { "epoch": 0.93, "learning_rate": 0.00015986248945968736, "loss": 0.0127, "step": 86420 }, { "epoch": 0.93, "learning_rate": 0.00015984627359408443, "loss": 0.0119, "step": 86430 }, { "epoch": 0.93, "learning_rate": 0.00015983005772848152, "loss": 0.0118, "step": 86440 }, { "epoch": 0.93, "learning_rate": 0.00015981384186287864, "loss": 0.0118, "step": 86450 }, { "epoch": 0.93, "learning_rate": 0.00015979762599727573, "loss": 0.0115, "step": 86460 }, { "epoch": 0.93, "learning_rate": 0.0001597814101316728, "loss": 0.011, "step": 86470 }, { "epoch": 0.93, "learning_rate": 0.00015976519426606992, "loss": 0.0136, "step": 86480 }, { "epoch": 0.93, "learning_rate": 0.000159748978400467, "loss": 0.0139, "step": 86490 }, { "epoch": 0.94, "learning_rate": 0.0001597327625348641, "loss": 0.016, "step": 86500 }, { "epoch": 0.94, "learning_rate": 0.00015971654666926117, "loss": 0.0111, "step": 86510 }, { "epoch": 0.94, "learning_rate": 0.0001597003308036583, "loss": 0.0141, "step": 86520 }, { "epoch": 0.94, "learning_rate": 0.00015968411493805538, "loss": 0.0173, "step": 86530 }, { "epoch": 0.94, "learning_rate": 0.00015966789907245247, "loss": 0.0145, "step": 86540 }, { "epoch": 0.94, "learning_rate": 0.00015965168320684957, "loss": 0.0106, "step": 86550 }, { "epoch": 0.94, "learning_rate": 0.00015963546734124666, "loss": 0.0153, "step": 86560 }, { "epoch": 0.94, "learning_rate": 0.00015961925147564375, "loss": 0.0134, "step": 86570 }, { "epoch": 0.94, "learning_rate": 0.00015960303561004087, "loss": 0.0147, "step": 86580 }, { "epoch": 0.94, "learning_rate": 0.00015958681974443794, "loss": 0.0136, "step": 86590 }, { "epoch": 0.94, "learning_rate": 0.00015957060387883503, "loss": 0.0114, "step": 86600 }, { "epoch": 0.94, "learning_rate": 0.00015955438801323212, "loss": 0.0103, "step": 86610 }, { "epoch": 0.94, "learning_rate": 0.00015953817214762924, "loss": 0.0128, "step": 86620 }, { "epoch": 0.94, "learning_rate": 0.0001595219562820263, "loss": 0.0105, "step": 86630 }, { "epoch": 0.94, "learning_rate": 0.0001595057404164234, "loss": 0.0139, "step": 86640 }, { "epoch": 0.94, "learning_rate": 0.00015948952455082052, "loss": 0.0117, "step": 86650 }, { "epoch": 0.94, "learning_rate": 0.00015947330868521761, "loss": 0.0107, "step": 86660 }, { "epoch": 0.94, "learning_rate": 0.00015945709281961468, "loss": 0.0145, "step": 86670 }, { "epoch": 0.94, "learning_rate": 0.0001594408769540118, "loss": 0.0128, "step": 86680 }, { "epoch": 0.94, "learning_rate": 0.0001594246610884089, "loss": 0.0129, "step": 86690 }, { "epoch": 0.94, "learning_rate": 0.00015940844522280599, "loss": 0.014, "step": 86700 }, { "epoch": 0.94, "learning_rate": 0.00015939222935720305, "loss": 0.0132, "step": 86710 }, { "epoch": 0.94, "learning_rate": 0.00015937601349160017, "loss": 0.0128, "step": 86720 }, { "epoch": 0.94, "learning_rate": 0.00015935979762599726, "loss": 0.0129, "step": 86730 }, { "epoch": 0.94, "learning_rate": 0.00015934358176039436, "loss": 0.0096, "step": 86740 }, { "epoch": 0.94, "learning_rate": 0.00015932736589479145, "loss": 0.0117, "step": 86750 }, { "epoch": 0.94, "learning_rate": 0.00015931115002918854, "loss": 0.013, "step": 86760 }, { "epoch": 0.94, "learning_rate": 0.00015929493416358563, "loss": 0.0118, "step": 86770 }, { "epoch": 0.94, "learning_rate": 0.00015927871829798275, "loss": 0.0113, "step": 86780 }, { "epoch": 0.94, "learning_rate": 0.00015926250243237982, "loss": 0.0106, "step": 86790 }, { "epoch": 0.94, "learning_rate": 0.0001592462865667769, "loss": 0.0127, "step": 86800 }, { "epoch": 0.94, "learning_rate": 0.000159230070701174, "loss": 0.0119, "step": 86810 }, { "epoch": 0.94, "learning_rate": 0.00015921385483557113, "loss": 0.0117, "step": 86820 }, { "epoch": 0.94, "learning_rate": 0.0001591976389699682, "loss": 0.0113, "step": 86830 }, { "epoch": 0.94, "learning_rate": 0.00015918142310436528, "loss": 0.0141, "step": 86840 }, { "epoch": 0.94, "learning_rate": 0.0001591652072387624, "loss": 0.0128, "step": 86850 }, { "epoch": 0.94, "learning_rate": 0.0001591489913731595, "loss": 0.0094, "step": 86860 }, { "epoch": 0.94, "learning_rate": 0.00015913277550755656, "loss": 0.0116, "step": 86870 }, { "epoch": 0.94, "learning_rate": 0.00015911655964195366, "loss": 0.0123, "step": 86880 }, { "epoch": 0.94, "learning_rate": 0.00015910034377635077, "loss": 0.0125, "step": 86890 }, { "epoch": 0.94, "learning_rate": 0.00015908412791074787, "loss": 0.0122, "step": 86900 }, { "epoch": 0.94, "learning_rate": 0.00015906791204514493, "loss": 0.0122, "step": 86910 }, { "epoch": 0.94, "learning_rate": 0.00015905169617954205, "loss": 0.0111, "step": 86920 }, { "epoch": 0.94, "learning_rate": 0.00015903548031393915, "loss": 0.0121, "step": 86930 }, { "epoch": 0.94, "learning_rate": 0.00015901926444833624, "loss": 0.0138, "step": 86940 }, { "epoch": 0.94, "learning_rate": 0.0001590030485827333, "loss": 0.0124, "step": 86950 }, { "epoch": 0.94, "learning_rate": 0.00015898683271713042, "loss": 0.0123, "step": 86960 }, { "epoch": 0.94, "learning_rate": 0.00015897061685152752, "loss": 0.0129, "step": 86970 }, { "epoch": 0.94, "learning_rate": 0.00015895440098592464, "loss": 0.012, "step": 86980 }, { "epoch": 0.94, "learning_rate": 0.0001589381851203217, "loss": 0.0123, "step": 86990 }, { "epoch": 0.94, "learning_rate": 0.0001589219692547188, "loss": 0.0121, "step": 87000 }, { "epoch": 0.94, "eval_cer": 0.921526065906118, "eval_loss": 0.008875695057213306, "eval_runtime": 121.5017, "eval_samples_per_second": 16.461, "eval_steps_per_second": 4.115, "step": 87000 }, { "epoch": 0.94, "learning_rate": 0.0001589057533891159, "loss": 0.0142, "step": 87010 }, { "epoch": 0.94, "learning_rate": 0.000158889537523513, "loss": 0.0114, "step": 87020 }, { "epoch": 0.94, "learning_rate": 0.00015887332165791007, "loss": 0.011, "step": 87030 }, { "epoch": 0.94, "learning_rate": 0.00015885710579230717, "loss": 0.0122, "step": 87040 }, { "epoch": 0.94, "learning_rate": 0.00015884088992670429, "loss": 0.0124, "step": 87050 }, { "epoch": 0.94, "learning_rate": 0.00015882467406110138, "loss": 0.0141, "step": 87060 }, { "epoch": 0.94, "learning_rate": 0.00015880845819549847, "loss": 0.0163, "step": 87070 }, { "epoch": 0.94, "learning_rate": 0.00015879224232989554, "loss": 0.0156, "step": 87080 }, { "epoch": 0.94, "learning_rate": 0.00015877602646429266, "loss": 0.0124, "step": 87090 }, { "epoch": 0.94, "learning_rate": 0.00015875981059868975, "loss": 0.0145, "step": 87100 }, { "epoch": 0.94, "learning_rate": 0.00015874359473308684, "loss": 0.0134, "step": 87110 }, { "epoch": 0.94, "learning_rate": 0.00015872737886748394, "loss": 0.0134, "step": 87120 }, { "epoch": 0.94, "learning_rate": 0.00015871116300188103, "loss": 0.0115, "step": 87130 }, { "epoch": 0.94, "learning_rate": 0.00015869494713627812, "loss": 0.0116, "step": 87140 }, { "epoch": 0.94, "learning_rate": 0.00015867873127067524, "loss": 0.0124, "step": 87150 }, { "epoch": 0.94, "learning_rate": 0.0001586625154050723, "loss": 0.0122, "step": 87160 }, { "epoch": 0.94, "learning_rate": 0.0001586462995394694, "loss": 0.0103, "step": 87170 }, { "epoch": 0.94, "learning_rate": 0.0001586300836738665, "loss": 0.0133, "step": 87180 }, { "epoch": 0.94, "learning_rate": 0.0001586138678082636, "loss": 0.0127, "step": 87190 }, { "epoch": 0.94, "learning_rate": 0.00015859765194266068, "loss": 0.0156, "step": 87200 }, { "epoch": 0.94, "learning_rate": 0.00015858143607705777, "loss": 0.0147, "step": 87210 }, { "epoch": 0.94, "learning_rate": 0.0001585652202114549, "loss": 0.0151, "step": 87220 }, { "epoch": 0.94, "learning_rate": 0.00015854900434585198, "loss": 0.0118, "step": 87230 }, { "epoch": 0.94, "learning_rate": 0.00015853278848024905, "loss": 0.0134, "step": 87240 }, { "epoch": 0.94, "learning_rate": 0.00015851657261464614, "loss": 0.0125, "step": 87250 }, { "epoch": 0.94, "learning_rate": 0.00015850035674904326, "loss": 0.0143, "step": 87260 }, { "epoch": 0.94, "learning_rate": 0.00015848414088344035, "loss": 0.0131, "step": 87270 }, { "epoch": 0.94, "learning_rate": 0.00015846792501783742, "loss": 0.0144, "step": 87280 }, { "epoch": 0.94, "learning_rate": 0.00015845170915223454, "loss": 0.013, "step": 87290 }, { "epoch": 0.94, "learning_rate": 0.00015843549328663163, "loss": 0.0116, "step": 87300 }, { "epoch": 0.94, "learning_rate": 0.00015841927742102872, "loss": 0.0129, "step": 87310 }, { "epoch": 0.94, "learning_rate": 0.0001584030615554258, "loss": 0.0154, "step": 87320 }, { "epoch": 0.94, "learning_rate": 0.0001583868456898229, "loss": 0.0137, "step": 87330 }, { "epoch": 0.94, "learning_rate": 0.00015837062982422, "loss": 0.0112, "step": 87340 }, { "epoch": 0.94, "learning_rate": 0.00015835441395861712, "loss": 0.0167, "step": 87350 }, { "epoch": 0.94, "learning_rate": 0.0001583381980930142, "loss": 0.0163, "step": 87360 }, { "epoch": 0.94, "learning_rate": 0.00015832198222741128, "loss": 0.0134, "step": 87370 }, { "epoch": 0.94, "learning_rate": 0.00015830576636180837, "loss": 0.0131, "step": 87380 }, { "epoch": 0.94, "learning_rate": 0.0001582895504962055, "loss": 0.0107, "step": 87390 }, { "epoch": 0.94, "learning_rate": 0.00015827333463060256, "loss": 0.0129, "step": 87400 }, { "epoch": 0.94, "learning_rate": 0.00015825711876499965, "loss": 0.0116, "step": 87410 }, { "epoch": 0.95, "learning_rate": 0.00015824090289939677, "loss": 0.0141, "step": 87420 }, { "epoch": 0.95, "learning_rate": 0.00015822468703379386, "loss": 0.0126, "step": 87430 }, { "epoch": 0.95, "learning_rate": 0.00015820847116819093, "loss": 0.0157, "step": 87440 }, { "epoch": 0.95, "learning_rate": 0.00015819225530258802, "loss": 0.0149, "step": 87450 }, { "epoch": 0.95, "learning_rate": 0.00015817603943698514, "loss": 0.0121, "step": 87460 }, { "epoch": 0.95, "learning_rate": 0.00015815982357138224, "loss": 0.016, "step": 87470 }, { "epoch": 0.95, "learning_rate": 0.0001581436077057793, "loss": 0.016, "step": 87480 }, { "epoch": 0.95, "learning_rate": 0.00015812739184017642, "loss": 0.0124, "step": 87490 }, { "epoch": 0.95, "learning_rate": 0.0001581111759745735, "loss": 0.0138, "step": 87500 }, { "epoch": 0.95, "learning_rate": 0.0001580949601089706, "loss": 0.0105, "step": 87510 }, { "epoch": 0.95, "learning_rate": 0.00015807874424336767, "loss": 0.013, "step": 87520 }, { "epoch": 0.95, "learning_rate": 0.0001580625283777648, "loss": 0.0113, "step": 87530 }, { "epoch": 0.95, "learning_rate": 0.00015804631251216188, "loss": 0.0152, "step": 87540 }, { "epoch": 0.95, "learning_rate": 0.00015803009664655898, "loss": 0.0153, "step": 87550 }, { "epoch": 0.95, "learning_rate": 0.00015801388078095607, "loss": 0.0141, "step": 87560 }, { "epoch": 0.95, "learning_rate": 0.00015799766491535316, "loss": 0.0113, "step": 87570 }, { "epoch": 0.95, "learning_rate": 0.00015798144904975026, "loss": 0.0144, "step": 87580 }, { "epoch": 0.95, "learning_rate": 0.00015796523318414738, "loss": 0.0148, "step": 87590 }, { "epoch": 0.95, "learning_rate": 0.00015794901731854444, "loss": 0.0154, "step": 87600 }, { "epoch": 0.95, "learning_rate": 0.00015793280145294153, "loss": 0.0152, "step": 87610 }, { "epoch": 0.95, "learning_rate": 0.00015791658558733863, "loss": 0.0103, "step": 87620 }, { "epoch": 0.95, "learning_rate": 0.00015790036972173575, "loss": 0.016, "step": 87630 }, { "epoch": 0.95, "learning_rate": 0.0001578841538561328, "loss": 0.0116, "step": 87640 }, { "epoch": 0.95, "learning_rate": 0.0001578679379905299, "loss": 0.0122, "step": 87650 }, { "epoch": 0.95, "learning_rate": 0.00015785172212492702, "loss": 0.0125, "step": 87660 }, { "epoch": 0.95, "learning_rate": 0.00015783550625932412, "loss": 0.0133, "step": 87670 }, { "epoch": 0.95, "learning_rate": 0.00015781929039372118, "loss": 0.0119, "step": 87680 }, { "epoch": 0.95, "learning_rate": 0.0001578030745281183, "loss": 0.0134, "step": 87690 }, { "epoch": 0.95, "learning_rate": 0.0001577868586625154, "loss": 0.011, "step": 87700 }, { "epoch": 0.95, "learning_rate": 0.0001577706427969125, "loss": 0.0164, "step": 87710 }, { "epoch": 0.95, "learning_rate": 0.00015775442693130955, "loss": 0.0104, "step": 87720 }, { "epoch": 0.95, "learning_rate": 0.00015773821106570667, "loss": 0.0125, "step": 87730 }, { "epoch": 0.95, "learning_rate": 0.00015772199520010377, "loss": 0.0146, "step": 87740 }, { "epoch": 0.95, "learning_rate": 0.00015770577933450086, "loss": 0.012, "step": 87750 }, { "epoch": 0.95, "learning_rate": 0.00015768956346889798, "loss": 0.0146, "step": 87760 }, { "epoch": 0.95, "learning_rate": 0.00015767334760329504, "loss": 0.013, "step": 87770 }, { "epoch": 0.95, "learning_rate": 0.00015765713173769214, "loss": 0.0153, "step": 87780 }, { "epoch": 0.95, "learning_rate": 0.00015764091587208926, "loss": 0.0138, "step": 87790 }, { "epoch": 0.95, "learning_rate": 0.00015762470000648635, "loss": 0.0121, "step": 87800 }, { "epoch": 0.95, "learning_rate": 0.00015760848414088342, "loss": 0.0152, "step": 87810 }, { "epoch": 0.95, "learning_rate": 0.0001575922682752805, "loss": 0.0128, "step": 87820 }, { "epoch": 0.95, "learning_rate": 0.00015757605240967763, "loss": 0.0115, "step": 87830 }, { "epoch": 0.95, "learning_rate": 0.00015755983654407472, "loss": 0.01, "step": 87840 }, { "epoch": 0.95, "learning_rate": 0.0001575436206784718, "loss": 0.0133, "step": 87850 }, { "epoch": 0.95, "learning_rate": 0.0001575274048128689, "loss": 0.0104, "step": 87860 }, { "epoch": 0.95, "learning_rate": 0.000157511188947266, "loss": 0.0115, "step": 87870 }, { "epoch": 0.95, "learning_rate": 0.0001574949730816631, "loss": 0.0136, "step": 87880 }, { "epoch": 0.95, "learning_rate": 0.00015747875721606016, "loss": 0.0108, "step": 87890 }, { "epoch": 0.95, "learning_rate": 0.00015746254135045728, "loss": 0.0113, "step": 87900 }, { "epoch": 0.95, "learning_rate": 0.00015744632548485437, "loss": 0.014, "step": 87910 }, { "epoch": 0.95, "learning_rate": 0.0001574301096192515, "loss": 0.0156, "step": 87920 }, { "epoch": 0.95, "learning_rate": 0.00015741389375364856, "loss": 0.0144, "step": 87930 }, { "epoch": 0.95, "learning_rate": 0.00015739767788804565, "loss": 0.0127, "step": 87940 }, { "epoch": 0.95, "learning_rate": 0.00015738146202244274, "loss": 0.0135, "step": 87950 }, { "epoch": 0.95, "learning_rate": 0.00015736524615683986, "loss": 0.0136, "step": 87960 }, { "epoch": 0.95, "learning_rate": 0.00015734903029123693, "loss": 0.012, "step": 87970 }, { "epoch": 0.95, "learning_rate": 0.00015733281442563402, "loss": 0.0136, "step": 87980 }, { "epoch": 0.95, "learning_rate": 0.00015731659856003114, "loss": 0.0106, "step": 87990 }, { "epoch": 0.95, "learning_rate": 0.00015730038269442823, "loss": 0.0125, "step": 88000 }, { "epoch": 0.95, "eval_cer": 0.9215382263475072, "eval_loss": 0.009381990879774094, "eval_runtime": 121.3259, "eval_samples_per_second": 16.485, "eval_steps_per_second": 4.121, "step": 88000 }, { "epoch": 0.95, "learning_rate": 0.0001572841668288253, "loss": 0.0133, "step": 88010 }, { "epoch": 0.95, "learning_rate": 0.0001572679509632224, "loss": 0.0147, "step": 88020 }, { "epoch": 0.95, "learning_rate": 0.0001572517350976195, "loss": 0.0137, "step": 88030 }, { "epoch": 0.95, "learning_rate": 0.0001572355192320166, "loss": 0.0128, "step": 88040 }, { "epoch": 0.95, "learning_rate": 0.00015721930336641367, "loss": 0.0126, "step": 88050 }, { "epoch": 0.95, "learning_rate": 0.0001572030875008108, "loss": 0.0127, "step": 88060 }, { "epoch": 0.95, "learning_rate": 0.00015718687163520788, "loss": 0.015, "step": 88070 }, { "epoch": 0.95, "learning_rate": 0.00015717065576960497, "loss": 0.0116, "step": 88080 }, { "epoch": 0.95, "learning_rate": 0.00015715443990400204, "loss": 0.0132, "step": 88090 }, { "epoch": 0.95, "learning_rate": 0.00015713822403839916, "loss": 0.014, "step": 88100 }, { "epoch": 0.95, "learning_rate": 0.00015712200817279625, "loss": 0.0106, "step": 88110 }, { "epoch": 0.95, "learning_rate": 0.00015710579230719334, "loss": 0.0123, "step": 88120 }, { "epoch": 0.95, "learning_rate": 0.00015708957644159044, "loss": 0.0156, "step": 88130 }, { "epoch": 0.95, "learning_rate": 0.00015707336057598753, "loss": 0.0141, "step": 88140 }, { "epoch": 0.95, "learning_rate": 0.00015705714471038462, "loss": 0.0122, "step": 88150 }, { "epoch": 0.95, "learning_rate": 0.00015704092884478174, "loss": 0.0137, "step": 88160 }, { "epoch": 0.95, "learning_rate": 0.0001570247129791788, "loss": 0.0127, "step": 88170 }, { "epoch": 0.95, "learning_rate": 0.0001570084971135759, "loss": 0.0124, "step": 88180 }, { "epoch": 0.95, "learning_rate": 0.000156992281247973, "loss": 0.0143, "step": 88190 }, { "epoch": 0.95, "learning_rate": 0.00015697606538237011, "loss": 0.0118, "step": 88200 }, { "epoch": 0.95, "learning_rate": 0.00015695984951676718, "loss": 0.0149, "step": 88210 }, { "epoch": 0.95, "learning_rate": 0.00015694363365116427, "loss": 0.0121, "step": 88220 }, { "epoch": 0.95, "learning_rate": 0.0001569274177855614, "loss": 0.0113, "step": 88230 }, { "epoch": 0.95, "learning_rate": 0.00015691120191995848, "loss": 0.0132, "step": 88240 }, { "epoch": 0.95, "learning_rate": 0.00015689498605435555, "loss": 0.0118, "step": 88250 }, { "epoch": 0.95, "learning_rate": 0.00015687877018875264, "loss": 0.0136, "step": 88260 }, { "epoch": 0.95, "learning_rate": 0.00015686255432314976, "loss": 0.0127, "step": 88270 }, { "epoch": 0.95, "learning_rate": 0.00015684633845754686, "loss": 0.0107, "step": 88280 }, { "epoch": 0.95, "learning_rate": 0.00015683012259194392, "loss": 0.0113, "step": 88290 }, { "epoch": 0.95, "learning_rate": 0.00015681390672634104, "loss": 0.0121, "step": 88300 }, { "epoch": 0.95, "learning_rate": 0.00015679769086073813, "loss": 0.0105, "step": 88310 }, { "epoch": 0.95, "learning_rate": 0.00015678147499513523, "loss": 0.0129, "step": 88320 }, { "epoch": 0.95, "learning_rate": 0.0001567652591295323, "loss": 0.0153, "step": 88330 }, { "epoch": 0.95, "learning_rate": 0.0001567490432639294, "loss": 0.0178, "step": 88340 }, { "epoch": 0.96, "learning_rate": 0.0001567328273983265, "loss": 0.0166, "step": 88350 }, { "epoch": 0.96, "learning_rate": 0.00015671661153272363, "loss": 0.0148, "step": 88360 }, { "epoch": 0.96, "learning_rate": 0.0001567003956671207, "loss": 0.0126, "step": 88370 }, { "epoch": 0.96, "learning_rate": 0.00015668417980151778, "loss": 0.014, "step": 88380 }, { "epoch": 0.96, "learning_rate": 0.00015666796393591488, "loss": 0.0131, "step": 88390 }, { "epoch": 0.96, "learning_rate": 0.000156651748070312, "loss": 0.0111, "step": 88400 }, { "epoch": 0.96, "learning_rate": 0.00015663553220470906, "loss": 0.0119, "step": 88410 }, { "epoch": 0.96, "learning_rate": 0.00015661931633910615, "loss": 0.0115, "step": 88420 }, { "epoch": 0.96, "learning_rate": 0.00015660310047350327, "loss": 0.0123, "step": 88430 }, { "epoch": 0.96, "learning_rate": 0.00015658688460790037, "loss": 0.0114, "step": 88440 }, { "epoch": 0.96, "learning_rate": 0.00015657066874229743, "loss": 0.0168, "step": 88450 }, { "epoch": 0.96, "learning_rate": 0.00015655445287669453, "loss": 0.0176, "step": 88460 }, { "epoch": 0.96, "learning_rate": 0.00015653823701109165, "loss": 0.0113, "step": 88470 }, { "epoch": 0.96, "learning_rate": 0.00015652202114548874, "loss": 0.0116, "step": 88480 }, { "epoch": 0.96, "learning_rate": 0.00015650580527988583, "loss": 0.0117, "step": 88490 }, { "epoch": 0.96, "learning_rate": 0.00015648958941428292, "loss": 0.0115, "step": 88500 }, { "epoch": 0.96, "learning_rate": 0.00015647337354868002, "loss": 0.0145, "step": 88510 }, { "epoch": 0.96, "learning_rate": 0.0001564571576830771, "loss": 0.013, "step": 88520 }, { "epoch": 0.96, "learning_rate": 0.00015644094181747423, "loss": 0.01, "step": 88530 }, { "epoch": 0.96, "learning_rate": 0.0001564247259518713, "loss": 0.0122, "step": 88540 }, { "epoch": 0.96, "learning_rate": 0.0001564085100862684, "loss": 0.0139, "step": 88550 }, { "epoch": 0.96, "learning_rate": 0.00015639229422066548, "loss": 0.0124, "step": 88560 }, { "epoch": 0.96, "learning_rate": 0.0001563760783550626, "loss": 0.0154, "step": 88570 }, { "epoch": 0.96, "learning_rate": 0.00015635986248945967, "loss": 0.0127, "step": 88580 }, { "epoch": 0.96, "learning_rate": 0.00015634364662385676, "loss": 0.0107, "step": 88590 }, { "epoch": 0.96, "learning_rate": 0.00015632743075825388, "loss": 0.0155, "step": 88600 }, { "epoch": 0.96, "learning_rate": 0.00015631121489265097, "loss": 0.0188, "step": 88610 }, { "epoch": 0.96, "learning_rate": 0.00015629499902704804, "loss": 0.0135, "step": 88620 }, { "epoch": 0.96, "learning_rate": 0.00015627878316144513, "loss": 0.0123, "step": 88630 }, { "epoch": 0.96, "learning_rate": 0.00015626256729584225, "loss": 0.0102, "step": 88640 }, { "epoch": 0.96, "learning_rate": 0.00015624635143023934, "loss": 0.0125, "step": 88650 }, { "epoch": 0.96, "learning_rate": 0.0001562301355646364, "loss": 0.0136, "step": 88660 }, { "epoch": 0.96, "learning_rate": 0.00015621391969903353, "loss": 0.0178, "step": 88670 }, { "epoch": 0.96, "learning_rate": 0.00015619770383343062, "loss": 0.0143, "step": 88680 }, { "epoch": 0.96, "learning_rate": 0.0001561814879678277, "loss": 0.0108, "step": 88690 }, { "epoch": 0.96, "learning_rate": 0.0001561652721022248, "loss": 0.0127, "step": 88700 }, { "epoch": 0.96, "learning_rate": 0.0001561490562366219, "loss": 0.0144, "step": 88710 }, { "epoch": 0.96, "learning_rate": 0.000156132840371019, "loss": 0.0126, "step": 88720 }, { "epoch": 0.96, "learning_rate": 0.0001561166245054161, "loss": 0.0115, "step": 88730 }, { "epoch": 0.96, "learning_rate": 0.00015610040863981318, "loss": 0.0134, "step": 88740 }, { "epoch": 0.96, "learning_rate": 0.00015608419277421027, "loss": 0.0142, "step": 88750 }, { "epoch": 0.96, "learning_rate": 0.00015606797690860736, "loss": 0.0131, "step": 88760 }, { "epoch": 0.96, "learning_rate": 0.00015605176104300448, "loss": 0.013, "step": 88770 }, { "epoch": 0.96, "learning_rate": 0.00015603554517740155, "loss": 0.0142, "step": 88780 }, { "epoch": 0.96, "learning_rate": 0.00015601932931179864, "loss": 0.011, "step": 88790 }, { "epoch": 0.96, "learning_rate": 0.00015600311344619576, "loss": 0.011, "step": 88800 }, { "epoch": 0.96, "learning_rate": 0.00015598689758059285, "loss": 0.0143, "step": 88810 }, { "epoch": 0.96, "learning_rate": 0.00015597068171498992, "loss": 0.0151, "step": 88820 }, { "epoch": 0.96, "learning_rate": 0.000155954465849387, "loss": 0.0126, "step": 88830 }, { "epoch": 0.96, "learning_rate": 0.00015593824998378413, "loss": 0.013, "step": 88840 }, { "epoch": 0.96, "learning_rate": 0.00015592203411818122, "loss": 0.0129, "step": 88850 }, { "epoch": 0.96, "learning_rate": 0.0001559058182525783, "loss": 0.0118, "step": 88860 }, { "epoch": 0.96, "learning_rate": 0.0001558896023869754, "loss": 0.0108, "step": 88870 }, { "epoch": 0.96, "learning_rate": 0.0001558733865213725, "loss": 0.0123, "step": 88880 }, { "epoch": 0.96, "learning_rate": 0.0001558571706557696, "loss": 0.013, "step": 88890 }, { "epoch": 0.96, "learning_rate": 0.00015584095479016666, "loss": 0.0136, "step": 88900 }, { "epoch": 0.96, "learning_rate": 0.00015582473892456378, "loss": 0.013, "step": 88910 }, { "epoch": 0.96, "learning_rate": 0.00015580852305896087, "loss": 0.0125, "step": 88920 }, { "epoch": 0.96, "learning_rate": 0.000155792307193358, "loss": 0.0112, "step": 88930 }, { "epoch": 0.96, "learning_rate": 0.00015577609132775506, "loss": 0.012, "step": 88940 }, { "epoch": 0.96, "learning_rate": 0.00015575987546215215, "loss": 0.0141, "step": 88950 }, { "epoch": 0.96, "learning_rate": 0.00015574365959654924, "loss": 0.0146, "step": 88960 }, { "epoch": 0.96, "learning_rate": 0.00015572744373094636, "loss": 0.0124, "step": 88970 }, { "epoch": 0.96, "learning_rate": 0.00015571122786534343, "loss": 0.0113, "step": 88980 }, { "epoch": 0.96, "learning_rate": 0.00015569501199974052, "loss": 0.016, "step": 88990 }, { "epoch": 0.96, "learning_rate": 0.00015567879613413764, "loss": 0.0113, "step": 89000 }, { "epoch": 0.96, "eval_cer": 0.9215721018628059, "eval_loss": 0.008774230256676674, "eval_runtime": 121.1545, "eval_samples_per_second": 16.508, "eval_steps_per_second": 4.127, "step": 89000 }, { "epoch": 0.96, "learning_rate": 0.00015566258026853473, "loss": 0.0099, "step": 89010 }, { "epoch": 0.96, "learning_rate": 0.0001556463644029318, "loss": 0.0121, "step": 89020 }, { "epoch": 0.96, "learning_rate": 0.0001556301485373289, "loss": 0.0121, "step": 89030 }, { "epoch": 0.96, "learning_rate": 0.000155613932671726, "loss": 0.0141, "step": 89040 }, { "epoch": 0.96, "learning_rate": 0.0001555977168061231, "loss": 0.0113, "step": 89050 }, { "epoch": 0.96, "learning_rate": 0.00015558150094052017, "loss": 0.0121, "step": 89060 }, { "epoch": 0.96, "learning_rate": 0.0001555652850749173, "loss": 0.012, "step": 89070 }, { "epoch": 0.96, "learning_rate": 0.00015554906920931438, "loss": 0.0153, "step": 89080 }, { "epoch": 0.96, "learning_rate": 0.00015553285334371148, "loss": 0.014, "step": 89090 }, { "epoch": 0.96, "learning_rate": 0.00015551663747810854, "loss": 0.0124, "step": 89100 }, { "epoch": 0.96, "learning_rate": 0.00015550042161250566, "loss": 0.0138, "step": 89110 }, { "epoch": 0.96, "learning_rate": 0.00015548420574690275, "loss": 0.0135, "step": 89120 }, { "epoch": 0.96, "learning_rate": 0.00015546798988129985, "loss": 0.0159, "step": 89130 }, { "epoch": 0.96, "learning_rate": 0.00015545177401569694, "loss": 0.0138, "step": 89140 }, { "epoch": 0.96, "learning_rate": 0.00015543555815009403, "loss": 0.0143, "step": 89150 }, { "epoch": 0.96, "learning_rate": 0.00015541934228449113, "loss": 0.0137, "step": 89160 }, { "epoch": 0.96, "learning_rate": 0.00015540312641888825, "loss": 0.0137, "step": 89170 }, { "epoch": 0.96, "learning_rate": 0.0001553869105532853, "loss": 0.013, "step": 89180 }, { "epoch": 0.96, "learning_rate": 0.0001553706946876824, "loss": 0.0125, "step": 89190 }, { "epoch": 0.96, "learning_rate": 0.0001553544788220795, "loss": 0.0134, "step": 89200 }, { "epoch": 0.96, "learning_rate": 0.00015533826295647662, "loss": 0.0132, "step": 89210 }, { "epoch": 0.96, "learning_rate": 0.0001553220470908737, "loss": 0.014, "step": 89220 }, { "epoch": 0.96, "learning_rate": 0.00015530583122527077, "loss": 0.0117, "step": 89230 }, { "epoch": 0.96, "learning_rate": 0.0001552896153596679, "loss": 0.0107, "step": 89240 }, { "epoch": 0.96, "learning_rate": 0.000155273399494065, "loss": 0.0122, "step": 89250 }, { "epoch": 0.96, "learning_rate": 0.00015525718362846208, "loss": 0.0129, "step": 89260 }, { "epoch": 0.97, "learning_rate": 0.00015524096776285915, "loss": 0.0137, "step": 89270 }, { "epoch": 0.97, "learning_rate": 0.00015522475189725627, "loss": 0.0152, "step": 89280 }, { "epoch": 0.97, "learning_rate": 0.00015520853603165336, "loss": 0.0135, "step": 89290 }, { "epoch": 0.97, "learning_rate": 0.00015519232016605048, "loss": 0.0148, "step": 89300 }, { "epoch": 0.97, "learning_rate": 0.00015517610430044754, "loss": 0.0125, "step": 89310 }, { "epoch": 0.97, "learning_rate": 0.00015515988843484464, "loss": 0.0125, "step": 89320 }, { "epoch": 0.97, "learning_rate": 0.00015514367256924173, "loss": 0.0098, "step": 89330 }, { "epoch": 0.97, "learning_rate": 0.00015512745670363885, "loss": 0.0122, "step": 89340 }, { "epoch": 0.97, "learning_rate": 0.00015511124083803592, "loss": 0.0121, "step": 89350 }, { "epoch": 0.97, "learning_rate": 0.000155095024972433, "loss": 0.0119, "step": 89360 }, { "epoch": 0.97, "learning_rate": 0.00015507880910683013, "loss": 0.013, "step": 89370 }, { "epoch": 0.97, "learning_rate": 0.00015506259324122722, "loss": 0.0133, "step": 89380 }, { "epoch": 0.97, "learning_rate": 0.00015504637737562429, "loss": 0.0129, "step": 89390 }, { "epoch": 0.97, "learning_rate": 0.00015503016151002138, "loss": 0.0122, "step": 89400 }, { "epoch": 0.97, "learning_rate": 0.0001550139456444185, "loss": 0.0115, "step": 89410 }, { "epoch": 0.97, "learning_rate": 0.0001549977297788156, "loss": 0.0139, "step": 89420 }, { "epoch": 0.97, "learning_rate": 0.00015498151391321266, "loss": 0.0111, "step": 89430 }, { "epoch": 0.97, "learning_rate": 0.00015496529804760978, "loss": 0.0106, "step": 89440 }, { "epoch": 0.97, "learning_rate": 0.00015494908218200687, "loss": 0.0137, "step": 89450 }, { "epoch": 0.97, "learning_rate": 0.00015493286631640396, "loss": 0.015, "step": 89460 }, { "epoch": 0.97, "learning_rate": 0.00015491665045080103, "loss": 0.0145, "step": 89470 }, { "epoch": 0.97, "learning_rate": 0.00015490043458519815, "loss": 0.0103, "step": 89480 }, { "epoch": 0.97, "learning_rate": 0.00015488421871959524, "loss": 0.0118, "step": 89490 }, { "epoch": 0.97, "learning_rate": 0.00015486800285399233, "loss": 0.0134, "step": 89500 }, { "epoch": 0.97, "learning_rate": 0.00015485178698838943, "loss": 0.0124, "step": 89510 }, { "epoch": 0.97, "learning_rate": 0.00015483557112278652, "loss": 0.0122, "step": 89520 }, { "epoch": 0.97, "learning_rate": 0.0001548193552571836, "loss": 0.0114, "step": 89530 }, { "epoch": 0.97, "learning_rate": 0.00015480313939158073, "loss": 0.0168, "step": 89540 }, { "epoch": 0.97, "learning_rate": 0.0001547869235259778, "loss": 0.0144, "step": 89550 }, { "epoch": 0.97, "learning_rate": 0.0001547707076603749, "loss": 0.0162, "step": 89560 }, { "epoch": 0.97, "learning_rate": 0.00015475449179477198, "loss": 0.013, "step": 89570 }, { "epoch": 0.97, "learning_rate": 0.0001547382759291691, "loss": 0.0133, "step": 89580 }, { "epoch": 0.97, "learning_rate": 0.00015472206006356617, "loss": 0.0095, "step": 89590 }, { "epoch": 0.97, "learning_rate": 0.00015470584419796326, "loss": 0.0118, "step": 89600 }, { "epoch": 0.97, "learning_rate": 0.00015468962833236038, "loss": 0.0166, "step": 89610 }, { "epoch": 0.97, "learning_rate": 0.00015467341246675747, "loss": 0.0119, "step": 89620 }, { "epoch": 0.97, "learning_rate": 0.00015465719660115454, "loss": 0.0159, "step": 89630 }, { "epoch": 0.97, "learning_rate": 0.00015464098073555163, "loss": 0.0131, "step": 89640 }, { "epoch": 0.97, "learning_rate": 0.00015462476486994875, "loss": 0.0121, "step": 89650 }, { "epoch": 0.97, "learning_rate": 0.00015460854900434584, "loss": 0.0135, "step": 89660 }, { "epoch": 0.97, "learning_rate": 0.0001545923331387429, "loss": 0.0158, "step": 89670 }, { "epoch": 0.97, "learning_rate": 0.00015457611727314003, "loss": 0.0128, "step": 89680 }, { "epoch": 0.97, "learning_rate": 0.00015455990140753712, "loss": 0.0113, "step": 89690 }, { "epoch": 0.97, "learning_rate": 0.00015454368554193422, "loss": 0.0143, "step": 89700 }, { "epoch": 0.97, "learning_rate": 0.0001545274696763313, "loss": 0.0127, "step": 89710 }, { "epoch": 0.97, "learning_rate": 0.0001545112538107284, "loss": 0.0114, "step": 89720 }, { "epoch": 0.97, "learning_rate": 0.0001544950379451255, "loss": 0.0112, "step": 89730 }, { "epoch": 0.97, "learning_rate": 0.0001544788220795226, "loss": 0.013, "step": 89740 }, { "epoch": 0.97, "learning_rate": 0.00015446260621391968, "loss": 0.0121, "step": 89750 }, { "epoch": 0.97, "learning_rate": 0.00015444639034831677, "loss": 0.0121, "step": 89760 }, { "epoch": 0.97, "learning_rate": 0.00015443017448271386, "loss": 0.0106, "step": 89770 }, { "epoch": 0.97, "learning_rate": 0.00015441395861711098, "loss": 0.0112, "step": 89780 }, { "epoch": 0.97, "learning_rate": 0.00015439774275150805, "loss": 0.0127, "step": 89790 }, { "epoch": 0.97, "learning_rate": 0.00015438152688590514, "loss": 0.0117, "step": 89800 }, { "epoch": 0.97, "learning_rate": 0.00015436531102030226, "loss": 0.0135, "step": 89810 }, { "epoch": 0.97, "learning_rate": 0.00015434909515469936, "loss": 0.0107, "step": 89820 }, { "epoch": 0.97, "learning_rate": 0.00015433287928909642, "loss": 0.0148, "step": 89830 }, { "epoch": 0.97, "learning_rate": 0.00015431666342349351, "loss": 0.0094, "step": 89840 }, { "epoch": 0.97, "learning_rate": 0.00015430044755789063, "loss": 0.0141, "step": 89850 }, { "epoch": 0.97, "learning_rate": 0.00015428423169228773, "loss": 0.0124, "step": 89860 }, { "epoch": 0.97, "learning_rate": 0.0001542680158266848, "loss": 0.0147, "step": 89870 }, { "epoch": 0.97, "learning_rate": 0.0001542517999610819, "loss": 0.0118, "step": 89880 }, { "epoch": 0.97, "learning_rate": 0.000154235584095479, "loss": 0.0166, "step": 89890 }, { "epoch": 0.97, "learning_rate": 0.0001542193682298761, "loss": 0.0131, "step": 89900 }, { "epoch": 0.97, "learning_rate": 0.00015420315236427316, "loss": 0.0153, "step": 89910 }, { "epoch": 0.97, "learning_rate": 0.00015418693649867028, "loss": 0.0114, "step": 89920 }, { "epoch": 0.97, "learning_rate": 0.00015417072063306738, "loss": 0.0157, "step": 89930 }, { "epoch": 0.97, "learning_rate": 0.0001541545047674645, "loss": 0.0136, "step": 89940 }, { "epoch": 0.97, "learning_rate": 0.0001541382889018616, "loss": 0.0128, "step": 89950 }, { "epoch": 0.97, "learning_rate": 0.00015412207303625865, "loss": 0.0115, "step": 89960 }, { "epoch": 0.97, "learning_rate": 0.00015410585717065575, "loss": 0.0119, "step": 89970 }, { "epoch": 0.97, "learning_rate": 0.00015408964130505287, "loss": 0.0121, "step": 89980 }, { "epoch": 0.97, "learning_rate": 0.00015407342543944996, "loss": 0.0107, "step": 89990 }, { "epoch": 0.97, "learning_rate": 0.00015405720957384702, "loss": 0.0098, "step": 90000 }, { "epoch": 0.97, "eval_cer": 0.9215616786273294, "eval_loss": 0.009352602064609528, "eval_runtime": 121.4051, "eval_samples_per_second": 16.474, "eval_steps_per_second": 4.118, "step": 90000 }, { "epoch": 0.97, "learning_rate": 0.00015404099370824414, "loss": 0.0143, "step": 90010 }, { "epoch": 0.97, "learning_rate": 0.00015402477784264124, "loss": 0.0109, "step": 90020 }, { "epoch": 0.97, "learning_rate": 0.00015400856197703833, "loss": 0.0133, "step": 90030 }, { "epoch": 0.97, "learning_rate": 0.0001539923461114354, "loss": 0.0097, "step": 90040 }, { "epoch": 0.97, "learning_rate": 0.00015397613024583252, "loss": 0.0134, "step": 90050 }, { "epoch": 0.97, "learning_rate": 0.0001539599143802296, "loss": 0.0111, "step": 90060 }, { "epoch": 0.97, "learning_rate": 0.0001539436985146267, "loss": 0.013, "step": 90070 }, { "epoch": 0.97, "learning_rate": 0.0001539274826490238, "loss": 0.0127, "step": 90080 }, { "epoch": 0.97, "learning_rate": 0.0001539112667834209, "loss": 0.0151, "step": 90090 }, { "epoch": 0.97, "learning_rate": 0.00015389505091781798, "loss": 0.0095, "step": 90100 }, { "epoch": 0.97, "learning_rate": 0.0001538788350522151, "loss": 0.0147, "step": 90110 }, { "epoch": 0.97, "learning_rate": 0.00015386261918661216, "loss": 0.0135, "step": 90120 }, { "epoch": 0.97, "learning_rate": 0.00015384640332100926, "loss": 0.0127, "step": 90130 }, { "epoch": 0.97, "learning_rate": 0.00015383018745540635, "loss": 0.0127, "step": 90140 }, { "epoch": 0.97, "learning_rate": 0.00015381397158980347, "loss": 0.0129, "step": 90150 }, { "epoch": 0.97, "learning_rate": 0.00015379775572420054, "loss": 0.0136, "step": 90160 }, { "epoch": 0.97, "learning_rate": 0.00015378153985859763, "loss": 0.012, "step": 90170 }, { "epoch": 0.97, "learning_rate": 0.00015376532399299475, "loss": 0.0109, "step": 90180 }, { "epoch": 0.97, "learning_rate": 0.00015374910812739184, "loss": 0.012, "step": 90190 }, { "epoch": 0.98, "learning_rate": 0.0001537328922617889, "loss": 0.0128, "step": 90200 }, { "epoch": 0.98, "learning_rate": 0.000153716676396186, "loss": 0.014, "step": 90210 }, { "epoch": 0.98, "learning_rate": 0.00015370046053058312, "loss": 0.0121, "step": 90220 }, { "epoch": 0.98, "learning_rate": 0.0001536842446649802, "loss": 0.0143, "step": 90230 }, { "epoch": 0.98, "learning_rate": 0.00015366802879937728, "loss": 0.0162, "step": 90240 }, { "epoch": 0.98, "learning_rate": 0.0001536518129337744, "loss": 0.0122, "step": 90250 }, { "epoch": 0.98, "learning_rate": 0.0001536355970681715, "loss": 0.011, "step": 90260 }, { "epoch": 0.98, "learning_rate": 0.00015361938120256858, "loss": 0.0144, "step": 90270 }, { "epoch": 0.98, "learning_rate": 0.00015360316533696565, "loss": 0.0125, "step": 90280 }, { "epoch": 0.98, "learning_rate": 0.00015358694947136277, "loss": 0.0117, "step": 90290 }, { "epoch": 0.98, "learning_rate": 0.00015357073360575986, "loss": 0.0193, "step": 90300 }, { "epoch": 0.98, "learning_rate": 0.00015355451774015698, "loss": 0.0116, "step": 90310 }, { "epoch": 0.98, "learning_rate": 0.00015353830187455405, "loss": 0.014, "step": 90320 }, { "epoch": 0.98, "learning_rate": 0.00015352208600895114, "loss": 0.0141, "step": 90330 }, { "epoch": 0.98, "learning_rate": 0.00015350587014334823, "loss": 0.0123, "step": 90340 }, { "epoch": 0.98, "learning_rate": 0.00015348965427774535, "loss": 0.0117, "step": 90350 }, { "epoch": 0.98, "learning_rate": 0.00015347343841214242, "loss": 0.0114, "step": 90360 }, { "epoch": 0.98, "learning_rate": 0.0001534572225465395, "loss": 0.0145, "step": 90370 }, { "epoch": 0.98, "learning_rate": 0.00015344100668093663, "loss": 0.0121, "step": 90380 }, { "epoch": 0.98, "learning_rate": 0.00015342479081533372, "loss": 0.0131, "step": 90390 }, { "epoch": 0.98, "learning_rate": 0.0001534085749497308, "loss": 0.0121, "step": 90400 }, { "epoch": 0.98, "learning_rate": 0.00015339235908412788, "loss": 0.0157, "step": 90410 }, { "epoch": 0.98, "learning_rate": 0.000153376143218525, "loss": 0.013, "step": 90420 }, { "epoch": 0.98, "learning_rate": 0.0001533599273529221, "loss": 0.0167, "step": 90430 }, { "epoch": 0.98, "learning_rate": 0.00015334371148731916, "loss": 0.0146, "step": 90440 }, { "epoch": 0.98, "learning_rate": 0.00015332749562171628, "loss": 0.0128, "step": 90450 }, { "epoch": 0.98, "learning_rate": 0.00015331127975611337, "loss": 0.0111, "step": 90460 }, { "epoch": 0.98, "learning_rate": 0.00015329506389051046, "loss": 0.0163, "step": 90470 }, { "epoch": 0.98, "learning_rate": 0.00015327884802490753, "loss": 0.0119, "step": 90480 }, { "epoch": 0.98, "learning_rate": 0.00015326263215930465, "loss": 0.0116, "step": 90490 }, { "epoch": 0.98, "learning_rate": 0.00015324641629370174, "loss": 0.0139, "step": 90500 }, { "epoch": 0.98, "learning_rate": 0.00015323020042809884, "loss": 0.0134, "step": 90510 }, { "epoch": 0.98, "learning_rate": 0.00015321398456249593, "loss": 0.0105, "step": 90520 }, { "epoch": 0.98, "learning_rate": 0.00015319776869689302, "loss": 0.0115, "step": 90530 }, { "epoch": 0.98, "learning_rate": 0.00015318155283129011, "loss": 0.0132, "step": 90540 }, { "epoch": 0.98, "learning_rate": 0.00015316533696568723, "loss": 0.0105, "step": 90550 }, { "epoch": 0.98, "learning_rate": 0.0001531491211000843, "loss": 0.011, "step": 90560 }, { "epoch": 0.98, "learning_rate": 0.0001531329052344814, "loss": 0.0154, "step": 90570 }, { "epoch": 0.98, "learning_rate": 0.00015311668936887849, "loss": 0.0118, "step": 90580 }, { "epoch": 0.98, "learning_rate": 0.0001531004735032756, "loss": 0.0124, "step": 90590 }, { "epoch": 0.98, "learning_rate": 0.00015308425763767267, "loss": 0.0154, "step": 90600 }, { "epoch": 0.98, "learning_rate": 0.00015306804177206976, "loss": 0.0126, "step": 90610 }, { "epoch": 0.98, "learning_rate": 0.00015305182590646688, "loss": 0.0113, "step": 90620 }, { "epoch": 0.98, "learning_rate": 0.00015303561004086398, "loss": 0.0103, "step": 90630 }, { "epoch": 0.98, "learning_rate": 0.00015301939417526107, "loss": 0.0126, "step": 90640 }, { "epoch": 0.98, "learning_rate": 0.00015300317830965813, "loss": 0.0136, "step": 90650 }, { "epoch": 0.98, "learning_rate": 0.00015298696244405525, "loss": 0.012, "step": 90660 }, { "epoch": 0.98, "learning_rate": 0.00015297074657845235, "loss": 0.0138, "step": 90670 }, { "epoch": 0.98, "learning_rate": 0.00015295453071284947, "loss": 0.0153, "step": 90680 }, { "epoch": 0.98, "learning_rate": 0.00015293831484724653, "loss": 0.012, "step": 90690 }, { "epoch": 0.98, "learning_rate": 0.00015292209898164363, "loss": 0.0123, "step": 90700 }, { "epoch": 0.98, "learning_rate": 0.00015290588311604072, "loss": 0.0122, "step": 90710 }, { "epoch": 0.98, "learning_rate": 0.00015288966725043784, "loss": 0.0124, "step": 90720 }, { "epoch": 0.98, "learning_rate": 0.0001528734513848349, "loss": 0.0109, "step": 90730 }, { "epoch": 0.98, "learning_rate": 0.000152857235519232, "loss": 0.012, "step": 90740 }, { "epoch": 0.98, "learning_rate": 0.00015284101965362912, "loss": 0.0102, "step": 90750 }, { "epoch": 0.98, "learning_rate": 0.0001528248037880262, "loss": 0.0151, "step": 90760 }, { "epoch": 0.98, "learning_rate": 0.00015280858792242327, "loss": 0.0149, "step": 90770 }, { "epoch": 0.98, "learning_rate": 0.00015279237205682037, "loss": 0.0153, "step": 90780 }, { "epoch": 0.98, "learning_rate": 0.0001527761561912175, "loss": 0.0137, "step": 90790 }, { "epoch": 0.98, "learning_rate": 0.00015275994032561458, "loss": 0.0164, "step": 90800 }, { "epoch": 0.98, "learning_rate": 0.00015274372446001165, "loss": 0.0134, "step": 90810 }, { "epoch": 0.98, "learning_rate": 0.00015272750859440877, "loss": 0.0117, "step": 90820 }, { "epoch": 0.98, "learning_rate": 0.00015271129272880586, "loss": 0.0094, "step": 90830 }, { "epoch": 0.98, "learning_rate": 0.00015269507686320295, "loss": 0.0105, "step": 90840 }, { "epoch": 0.98, "learning_rate": 0.00015267886099760002, "loss": 0.0147, "step": 90850 }, { "epoch": 0.98, "learning_rate": 0.00015266264513199714, "loss": 0.0137, "step": 90860 }, { "epoch": 0.98, "learning_rate": 0.00015264642926639423, "loss": 0.0108, "step": 90870 }, { "epoch": 0.98, "learning_rate": 0.00015263021340079132, "loss": 0.0171, "step": 90880 }, { "epoch": 0.98, "learning_rate": 0.00015261399753518841, "loss": 0.0163, "step": 90890 }, { "epoch": 0.98, "learning_rate": 0.0001525977816695855, "loss": 0.0102, "step": 90900 }, { "epoch": 0.98, "learning_rate": 0.0001525815658039826, "loss": 0.0135, "step": 90910 }, { "epoch": 0.98, "learning_rate": 0.00015256534993837972, "loss": 0.0131, "step": 90920 }, { "epoch": 0.98, "learning_rate": 0.00015254913407277679, "loss": 0.0135, "step": 90930 }, { "epoch": 0.98, "learning_rate": 0.00015253291820717388, "loss": 0.0111, "step": 90940 }, { "epoch": 0.98, "learning_rate": 0.00015251670234157097, "loss": 0.0138, "step": 90950 }, { "epoch": 0.98, "learning_rate": 0.0001525004864759681, "loss": 0.0134, "step": 90960 }, { "epoch": 0.98, "learning_rate": 0.00015248427061036516, "loss": 0.014, "step": 90970 }, { "epoch": 0.98, "learning_rate": 0.00015246805474476225, "loss": 0.0103, "step": 90980 }, { "epoch": 0.98, "learning_rate": 0.00015245183887915937, "loss": 0.0149, "step": 90990 }, { "epoch": 0.98, "learning_rate": 0.00015243562301355646, "loss": 0.0137, "step": 91000 }, { "epoch": 0.98, "eval_cer": 0.9215460437741146, "eval_loss": 0.00892550777643919, "eval_runtime": 121.1506, "eval_samples_per_second": 16.508, "eval_steps_per_second": 4.127, "step": 91000 }, { "epoch": 0.98, "learning_rate": 0.00015241940714795353, "loss": 0.013, "step": 91010 }, { "epoch": 0.98, "learning_rate": 0.00015240319128235065, "loss": 0.0129, "step": 91020 }, { "epoch": 0.98, "learning_rate": 0.00015238697541674774, "loss": 0.0135, "step": 91030 }, { "epoch": 0.98, "learning_rate": 0.00015237075955114483, "loss": 0.0144, "step": 91040 }, { "epoch": 0.98, "learning_rate": 0.0001523545436855419, "loss": 0.016, "step": 91050 }, { "epoch": 0.98, "learning_rate": 0.00015233832781993902, "loss": 0.0112, "step": 91060 }, { "epoch": 0.98, "learning_rate": 0.0001523221119543361, "loss": 0.0126, "step": 91070 }, { "epoch": 0.98, "learning_rate": 0.0001523058960887332, "loss": 0.0119, "step": 91080 }, { "epoch": 0.98, "learning_rate": 0.0001522896802231303, "loss": 0.0137, "step": 91090 }, { "epoch": 0.98, "learning_rate": 0.0001522734643575274, "loss": 0.0095, "step": 91100 }, { "epoch": 0.98, "learning_rate": 0.00015225724849192448, "loss": 0.0108, "step": 91110 }, { "epoch": 0.99, "learning_rate": 0.0001522410326263216, "loss": 0.0134, "step": 91120 }, { "epoch": 0.99, "learning_rate": 0.00015222481676071867, "loss": 0.0108, "step": 91130 }, { "epoch": 0.99, "learning_rate": 0.00015220860089511576, "loss": 0.0139, "step": 91140 }, { "epoch": 0.99, "learning_rate": 0.00015219238502951285, "loss": 0.0111, "step": 91150 }, { "epoch": 0.99, "learning_rate": 0.00015217616916390997, "loss": 0.0103, "step": 91160 }, { "epoch": 0.99, "learning_rate": 0.00015215995329830704, "loss": 0.0119, "step": 91170 }, { "epoch": 0.99, "learning_rate": 0.00015214373743270413, "loss": 0.0124, "step": 91180 }, { "epoch": 0.99, "learning_rate": 0.00015212752156710125, "loss": 0.0154, "step": 91190 }, { "epoch": 0.99, "learning_rate": 0.00015211130570149834, "loss": 0.015, "step": 91200 }, { "epoch": 0.99, "learning_rate": 0.0001520950898358954, "loss": 0.0116, "step": 91210 }, { "epoch": 0.99, "learning_rate": 0.0001520788739702925, "loss": 0.0101, "step": 91220 }, { "epoch": 0.99, "learning_rate": 0.00015206265810468962, "loss": 0.0123, "step": 91230 }, { "epoch": 0.99, "learning_rate": 0.00015204644223908671, "loss": 0.0115, "step": 91240 }, { "epoch": 0.99, "learning_rate": 0.00015203022637348378, "loss": 0.0142, "step": 91250 }, { "epoch": 0.99, "learning_rate": 0.0001520140105078809, "loss": 0.0132, "step": 91260 }, { "epoch": 0.99, "learning_rate": 0.000151997794642278, "loss": 0.0101, "step": 91270 }, { "epoch": 0.99, "learning_rate": 0.00015198157877667509, "loss": 0.0123, "step": 91280 }, { "epoch": 0.99, "learning_rate": 0.00015196536291107215, "loss": 0.0148, "step": 91290 }, { "epoch": 0.99, "learning_rate": 0.00015194914704546927, "loss": 0.0127, "step": 91300 }, { "epoch": 0.99, "learning_rate": 0.00015193293117986636, "loss": 0.0143, "step": 91310 }, { "epoch": 0.99, "learning_rate": 0.00015191671531426348, "loss": 0.0157, "step": 91320 }, { "epoch": 0.99, "learning_rate": 0.00015190049944866055, "loss": 0.0095, "step": 91330 }, { "epoch": 0.99, "learning_rate": 0.00015188428358305764, "loss": 0.0142, "step": 91340 }, { "epoch": 0.99, "learning_rate": 0.00015186806771745473, "loss": 0.0165, "step": 91350 }, { "epoch": 0.99, "learning_rate": 0.00015185185185185185, "loss": 0.0163, "step": 91360 }, { "epoch": 0.99, "learning_rate": 0.00015183563598624895, "loss": 0.0127, "step": 91370 }, { "epoch": 0.99, "learning_rate": 0.000151819420120646, "loss": 0.0138, "step": 91380 }, { "epoch": 0.99, "learning_rate": 0.00015180320425504313, "loss": 0.0135, "step": 91390 }, { "epoch": 0.99, "learning_rate": 0.00015178698838944023, "loss": 0.015, "step": 91400 }, { "epoch": 0.99, "learning_rate": 0.00015177077252383732, "loss": 0.0117, "step": 91410 }, { "epoch": 0.99, "learning_rate": 0.00015175455665823438, "loss": 0.0104, "step": 91420 }, { "epoch": 0.99, "learning_rate": 0.0001517383407926315, "loss": 0.013, "step": 91430 }, { "epoch": 0.99, "learning_rate": 0.0001517221249270286, "loss": 0.0114, "step": 91440 }, { "epoch": 0.99, "learning_rate": 0.0001517059090614257, "loss": 0.0118, "step": 91450 }, { "epoch": 0.99, "learning_rate": 0.00015168969319582278, "loss": 0.0103, "step": 91460 }, { "epoch": 0.99, "learning_rate": 0.00015167347733021987, "loss": 0.0095, "step": 91470 }, { "epoch": 0.99, "learning_rate": 0.00015165726146461697, "loss": 0.0156, "step": 91480 }, { "epoch": 0.99, "learning_rate": 0.0001516410455990141, "loss": 0.0134, "step": 91490 }, { "epoch": 0.99, "learning_rate": 0.00015162482973341115, "loss": 0.0108, "step": 91500 }, { "epoch": 0.99, "learning_rate": 0.00015160861386780825, "loss": 0.0148, "step": 91510 }, { "epoch": 0.99, "learning_rate": 0.00015159239800220534, "loss": 0.01, "step": 91520 }, { "epoch": 0.99, "learning_rate": 0.00015157618213660246, "loss": 0.0111, "step": 91530 }, { "epoch": 0.99, "learning_rate": 0.00015155996627099952, "loss": 0.011, "step": 91540 }, { "epoch": 0.99, "learning_rate": 0.00015154375040539662, "loss": 0.0124, "step": 91550 }, { "epoch": 0.99, "learning_rate": 0.00015152753453979374, "loss": 0.015, "step": 91560 }, { "epoch": 0.99, "learning_rate": 0.00015151131867419083, "loss": 0.0119, "step": 91570 }, { "epoch": 0.99, "learning_rate": 0.0001514951028085879, "loss": 0.0132, "step": 91580 }, { "epoch": 0.99, "learning_rate": 0.000151478886942985, "loss": 0.0146, "step": 91590 }, { "epoch": 0.99, "learning_rate": 0.0001514626710773821, "loss": 0.0133, "step": 91600 }, { "epoch": 0.99, "learning_rate": 0.0001514464552117792, "loss": 0.0137, "step": 91610 }, { "epoch": 0.99, "learning_rate": 0.00015143023934617627, "loss": 0.012, "step": 91620 }, { "epoch": 0.99, "learning_rate": 0.00015141402348057339, "loss": 0.0106, "step": 91630 }, { "epoch": 0.99, "learning_rate": 0.00015139780761497048, "loss": 0.0115, "step": 91640 }, { "epoch": 0.99, "learning_rate": 0.00015138159174936757, "loss": 0.0144, "step": 91650 }, { "epoch": 0.99, "learning_rate": 0.00015136537588376464, "loss": 0.0126, "step": 91660 }, { "epoch": 0.99, "learning_rate": 0.00015134916001816176, "loss": 0.011, "step": 91670 }, { "epoch": 0.99, "learning_rate": 0.00015133294415255885, "loss": 0.0149, "step": 91680 }, { "epoch": 0.99, "learning_rate": 0.00015131672828695597, "loss": 0.0119, "step": 91690 }, { "epoch": 0.99, "learning_rate": 0.00015130051242135303, "loss": 0.011, "step": 91700 }, { "epoch": 0.99, "learning_rate": 0.00015128429655575013, "loss": 0.0118, "step": 91710 }, { "epoch": 0.99, "learning_rate": 0.00015126808069014722, "loss": 0.012, "step": 91720 }, { "epoch": 0.99, "learning_rate": 0.00015125186482454434, "loss": 0.0101, "step": 91730 }, { "epoch": 0.99, "learning_rate": 0.0001512356489589414, "loss": 0.013, "step": 91740 }, { "epoch": 0.99, "learning_rate": 0.0001512194330933385, "loss": 0.0153, "step": 91750 }, { "epoch": 0.99, "learning_rate": 0.00015120321722773562, "loss": 0.0096, "step": 91760 }, { "epoch": 0.99, "learning_rate": 0.0001511870013621327, "loss": 0.0114, "step": 91770 }, { "epoch": 0.99, "learning_rate": 0.00015117078549652978, "loss": 0.0128, "step": 91780 }, { "epoch": 0.99, "learning_rate": 0.00015115456963092687, "loss": 0.0107, "step": 91790 }, { "epoch": 0.99, "learning_rate": 0.000151138353765324, "loss": 0.0125, "step": 91800 }, { "epoch": 0.99, "learning_rate": 0.00015112213789972108, "loss": 0.012, "step": 91810 }, { "epoch": 0.99, "learning_rate": 0.00015110592203411815, "loss": 0.012, "step": 91820 }, { "epoch": 0.99, "learning_rate": 0.00015108970616851527, "loss": 0.0109, "step": 91830 }, { "epoch": 0.99, "learning_rate": 0.00015107349030291236, "loss": 0.0095, "step": 91840 }, { "epoch": 0.99, "learning_rate": 0.00015105727443730945, "loss": 0.0105, "step": 91850 }, { "epoch": 0.99, "learning_rate": 0.00015104105857170652, "loss": 0.0112, "step": 91860 }, { "epoch": 0.99, "learning_rate": 0.00015102484270610364, "loss": 0.0126, "step": 91870 }, { "epoch": 0.99, "learning_rate": 0.00015100862684050073, "loss": 0.0121, "step": 91880 }, { "epoch": 0.99, "learning_rate": 0.00015099241097489782, "loss": 0.0116, "step": 91890 }, { "epoch": 0.99, "learning_rate": 0.00015097619510929492, "loss": 0.0138, "step": 91900 }, { "epoch": 0.99, "learning_rate": 0.000150959979243692, "loss": 0.0118, "step": 91910 }, { "epoch": 0.99, "learning_rate": 0.0001509437633780891, "loss": 0.0114, "step": 91920 }, { "epoch": 0.99, "learning_rate": 0.00015092754751248622, "loss": 0.0118, "step": 91930 }, { "epoch": 0.99, "learning_rate": 0.0001509113316468833, "loss": 0.0131, "step": 91940 }, { "epoch": 0.99, "learning_rate": 0.00015089511578128038, "loss": 0.0122, "step": 91950 }, { "epoch": 0.99, "learning_rate": 0.00015087889991567747, "loss": 0.015, "step": 91960 }, { "epoch": 0.99, "learning_rate": 0.0001508626840500746, "loss": 0.0154, "step": 91970 }, { "epoch": 0.99, "learning_rate": 0.00015084646818447166, "loss": 0.0149, "step": 91980 }, { "epoch": 0.99, "learning_rate": 0.00015083025231886875, "loss": 0.0118, "step": 91990 }, { "epoch": 0.99, "learning_rate": 0.00015081403645326587, "loss": 0.0105, "step": 92000 }, { "epoch": 0.99, "eval_cer": 0.9215434379652454, "eval_loss": 0.009060974232852459, "eval_runtime": 121.4309, "eval_samples_per_second": 16.47, "eval_steps_per_second": 4.118, "step": 92000 }, { "epoch": 0.99, "learning_rate": 0.00015079782058766296, "loss": 0.0132, "step": 92010 }, { "epoch": 0.99, "learning_rate": 0.00015078160472206003, "loss": 0.016, "step": 92020 }, { "epoch": 0.99, "learning_rate": 0.00015076538885645715, "loss": 0.0131, "step": 92030 }, { "epoch": 0.99, "learning_rate": 0.00015074917299085424, "loss": 0.0105, "step": 92040 }, { "epoch": 1.0, "learning_rate": 0.00015073295712525134, "loss": 0.0125, "step": 92050 }, { "epoch": 1.0, "learning_rate": 0.0001507167412596484, "loss": 0.013, "step": 92060 }, { "epoch": 1.0, "learning_rate": 0.00015070052539404552, "loss": 0.0111, "step": 92070 }, { "epoch": 1.0, "learning_rate": 0.0001506843095284426, "loss": 0.0119, "step": 92080 }, { "epoch": 1.0, "learning_rate": 0.0001506680936628397, "loss": 0.0132, "step": 92090 }, { "epoch": 1.0, "learning_rate": 0.00015065187779723683, "loss": 0.0117, "step": 92100 }, { "epoch": 1.0, "learning_rate": 0.0001506356619316339, "loss": 0.0158, "step": 92110 }, { "epoch": 1.0, "learning_rate": 0.00015061944606603098, "loss": 0.0124, "step": 92120 }, { "epoch": 1.0, "learning_rate": 0.0001506032302004281, "loss": 0.0115, "step": 92130 }, { "epoch": 1.0, "learning_rate": 0.0001505870143348252, "loss": 0.0114, "step": 92140 }, { "epoch": 1.0, "learning_rate": 0.00015057079846922226, "loss": 0.0126, "step": 92150 }, { "epoch": 1.0, "learning_rate": 0.00015055458260361936, "loss": 0.0145, "step": 92160 }, { "epoch": 1.0, "learning_rate": 0.00015053836673801648, "loss": 0.0114, "step": 92170 }, { "epoch": 1.0, "learning_rate": 0.00015052215087241357, "loss": 0.013, "step": 92180 }, { "epoch": 1.0, "learning_rate": 0.00015050593500681063, "loss": 0.0159, "step": 92190 }, { "epoch": 1.0, "learning_rate": 0.00015048971914120775, "loss": 0.0113, "step": 92200 }, { "epoch": 1.0, "learning_rate": 0.00015047350327560485, "loss": 0.0131, "step": 92210 }, { "epoch": 1.0, "learning_rate": 0.00015045728741000194, "loss": 0.0123, "step": 92220 }, { "epoch": 1.0, "learning_rate": 0.000150441071544399, "loss": 0.0161, "step": 92230 }, { "epoch": 1.0, "learning_rate": 0.00015042485567879612, "loss": 0.0123, "step": 92240 }, { "epoch": 1.0, "learning_rate": 0.00015040863981319322, "loss": 0.012, "step": 92250 }, { "epoch": 1.0, "learning_rate": 0.00015039242394759034, "loss": 0.0143, "step": 92260 }, { "epoch": 1.0, "learning_rate": 0.0001503762080819874, "loss": 0.0117, "step": 92270 }, { "epoch": 1.0, "learning_rate": 0.0001503599922163845, "loss": 0.0107, "step": 92280 }, { "epoch": 1.0, "learning_rate": 0.0001503437763507816, "loss": 0.0115, "step": 92290 }, { "epoch": 1.0, "learning_rate": 0.0001503275604851787, "loss": 0.0109, "step": 92300 }, { "epoch": 1.0, "learning_rate": 0.00015031134461957577, "loss": 0.0108, "step": 92310 }, { "epoch": 1.0, "learning_rate": 0.00015029512875397287, "loss": 0.0131, "step": 92320 }, { "epoch": 1.0, "learning_rate": 0.00015027891288836999, "loss": 0.0136, "step": 92330 }, { "epoch": 1.0, "learning_rate": 0.00015026269702276708, "loss": 0.0126, "step": 92340 }, { "epoch": 1.0, "learning_rate": 0.00015024648115716414, "loss": 0.0139, "step": 92350 }, { "epoch": 1.0, "learning_rate": 0.00015023026529156124, "loss": 0.0113, "step": 92360 }, { "epoch": 1.0, "learning_rate": 0.00015021404942595836, "loss": 0.0121, "step": 92370 }, { "epoch": 1.0, "learning_rate": 0.00015019783356035545, "loss": 0.0135, "step": 92380 }, { "epoch": 1.0, "learning_rate": 0.00015018161769475252, "loss": 0.0128, "step": 92390 }, { "epoch": 1.0, "learning_rate": 0.00015016540182914964, "loss": 0.0155, "step": 92400 }, { "epoch": 1.0, "learning_rate": 0.00015014918596354673, "loss": 0.0139, "step": 92410 }, { "epoch": 1.0, "learning_rate": 0.00015013297009794382, "loss": 0.0114, "step": 92420 }, { "epoch": 1.0, "learning_rate": 0.0001501167542323409, "loss": 0.0156, "step": 92430 }, { "epoch": 1.0, "learning_rate": 0.000150100538366738, "loss": 0.0109, "step": 92440 }, { "epoch": 1.0, "learning_rate": 0.0001500843225011351, "loss": 0.0094, "step": 92450 }, { "epoch": 1.0, "learning_rate": 0.0001500681066355322, "loss": 0.0136, "step": 92460 }, { "epoch": 1.0, "learning_rate": 0.00015005189076992928, "loss": 0.0111, "step": 92470 }, { "epoch": 1.0, "learning_rate": 0.00015003567490432638, "loss": 0.0134, "step": 92480 }, { "epoch": 1.0, "learning_rate": 0.00015001945903872347, "loss": 0.0093, "step": 92490 }, { "epoch": 1.0, "learning_rate": 0.0001500032431731206, "loss": 0.0096, "step": 92500 }, { "epoch": 1.0, "learning_rate": 0.00014998702730751766, "loss": 0.0093, "step": 92510 }, { "epoch": 1.0, "learning_rate": 0.00014997081144191475, "loss": 0.0138, "step": 92520 }, { "epoch": 1.0, "learning_rate": 0.00014995459557631184, "loss": 0.0107, "step": 92530 }, { "epoch": 1.0, "learning_rate": 0.00014993837971070893, "loss": 0.0098, "step": 92540 }, { "epoch": 1.0, "learning_rate": 0.00014992216384510605, "loss": 0.0117, "step": 92550 }, { "epoch": 1.0, "learning_rate": 0.00014990594797950312, "loss": 0.0131, "step": 92560 }, { "epoch": 1.0, "learning_rate": 0.00014988973211390024, "loss": 0.0128, "step": 92570 }, { "epoch": 1.0, "learning_rate": 0.0001498735162482973, "loss": 0.0092, "step": 92580 }, { "epoch": 1.0, "learning_rate": 0.00014985730038269442, "loss": 0.0139, "step": 92590 }, { "epoch": 1.0, "learning_rate": 0.0001498410845170915, "loss": 0.0088, "step": 92600 }, { "epoch": 1.0, "learning_rate": 0.0001498248686514886, "loss": 0.0101, "step": 92610 }, { "epoch": 1.0, "learning_rate": 0.0001498086527858857, "loss": 0.0138, "step": 92620 }, { "epoch": 1.0, "learning_rate": 0.0001497924369202828, "loss": 0.0098, "step": 92630 }, { "epoch": 1.0, "learning_rate": 0.0001497762210546799, "loss": 0.014, "step": 92640 }, { "epoch": 1.0, "learning_rate": 0.00014976000518907698, "loss": 0.0089, "step": 92650 }, { "epoch": 1.0, "learning_rate": 0.00014974378932347407, "loss": 0.0123, "step": 92660 }, { "epoch": 1.0, "learning_rate": 0.00014972757345787117, "loss": 0.0092, "step": 92670 }, { "epoch": 1.0, "learning_rate": 0.00014971135759226826, "loss": 0.0125, "step": 92680 }, { "epoch": 1.0, "learning_rate": 0.00014969514172666535, "loss": 0.0099, "step": 92690 }, { "epoch": 1.0, "learning_rate": 0.00014967892586106244, "loss": 0.0126, "step": 92700 }, { "epoch": 1.0, "learning_rate": 0.00014966270999545954, "loss": 0.0114, "step": 92710 }, { "epoch": 1.0, "learning_rate": 0.00014964649412985663, "loss": 0.0114, "step": 92720 }, { "epoch": 1.0, "learning_rate": 0.00014963027826425372, "loss": 0.0077, "step": 92730 }, { "epoch": 1.0, "learning_rate": 0.00014961406239865082, "loss": 0.0095, "step": 92740 }, { "epoch": 1.0, "learning_rate": 0.0001495978465330479, "loss": 0.0125, "step": 92750 }, { "epoch": 1.0, "learning_rate": 0.000149581630667445, "loss": 0.01, "step": 92760 }, { "epoch": 1.0, "learning_rate": 0.00014956541480184212, "loss": 0.0113, "step": 92770 }, { "epoch": 1.0, "learning_rate": 0.0001495491989362392, "loss": 0.0108, "step": 92780 }, { "epoch": 1.0, "learning_rate": 0.0001495329830706363, "loss": 0.0103, "step": 92790 }, { "epoch": 1.0, "learning_rate": 0.0001495167672050334, "loss": 0.011, "step": 92800 }, { "epoch": 1.0, "learning_rate": 0.0001495005513394305, "loss": 0.0098, "step": 92810 }, { "epoch": 1.0, "learning_rate": 0.00014948433547382758, "loss": 0.0096, "step": 92820 }, { "epoch": 1.0, "learning_rate": 0.00014946811960822468, "loss": 0.0103, "step": 92830 }, { "epoch": 1.0, "learning_rate": 0.00014945190374262177, "loss": 0.0086, "step": 92840 }, { "epoch": 1.0, "learning_rate": 0.00014943568787701886, "loss": 0.0094, "step": 92850 }, { "epoch": 1.0, "learning_rate": 0.00014941947201141596, "loss": 0.0107, "step": 92860 }, { "epoch": 1.0, "learning_rate": 0.00014940325614581305, "loss": 0.0128, "step": 92870 }, { "epoch": 1.0, "learning_rate": 0.00014938704028021014, "loss": 0.013, "step": 92880 }, { "epoch": 1.0, "learning_rate": 0.00014937082441460723, "loss": 0.0113, "step": 92890 }, { "epoch": 1.0, "learning_rate": 0.00014935460854900433, "loss": 0.0117, "step": 92900 }, { "epoch": 1.0, "learning_rate": 0.00014933839268340142, "loss": 0.012, "step": 92910 }, { "epoch": 1.0, "learning_rate": 0.00014932217681779854, "loss": 0.0142, "step": 92920 }, { "epoch": 1.0, "learning_rate": 0.0001493059609521956, "loss": 0.0097, "step": 92930 }, { "epoch": 1.0, "learning_rate": 0.00014928974508659272, "loss": 0.0147, "step": 92940 }, { "epoch": 1.0, "learning_rate": 0.0001492735292209898, "loss": 0.0109, "step": 92950 }, { "epoch": 1.0, "learning_rate": 0.0001492573133553869, "loss": 0.0133, "step": 92960 }, { "epoch": 1.01, "learning_rate": 0.00014924109748978398, "loss": 0.0109, "step": 92970 }, { "epoch": 1.01, "learning_rate": 0.0001492248816241811, "loss": 0.0102, "step": 92980 }, { "epoch": 1.01, "learning_rate": 0.0001492086657585782, "loss": 0.0131, "step": 92990 }, { "epoch": 1.01, "learning_rate": 0.00014919244989297528, "loss": 0.01, "step": 93000 }, { "epoch": 1.01, "eval_cer": 0.9215599414214166, "eval_loss": 0.008955257013440132, "eval_runtime": 121.985, "eval_samples_per_second": 16.395, "eval_steps_per_second": 4.099, "step": 93000 }, { "epoch": 1.01, "learning_rate": 0.00014917623402737237, "loss": 0.0093, "step": 93010 }, { "epoch": 1.01, "learning_rate": 0.00014916001816176947, "loss": 0.011, "step": 93020 }, { "epoch": 1.01, "learning_rate": 0.00014914380229616656, "loss": 0.0098, "step": 93030 }, { "epoch": 1.01, "learning_rate": 0.00014912758643056365, "loss": 0.0138, "step": 93040 }, { "epoch": 1.01, "learning_rate": 0.00014911137056496075, "loss": 0.0113, "step": 93050 }, { "epoch": 1.01, "learning_rate": 0.00014909515469935784, "loss": 0.0107, "step": 93060 }, { "epoch": 1.01, "learning_rate": 0.00014907893883375493, "loss": 0.0111, "step": 93070 }, { "epoch": 1.01, "learning_rate": 0.00014906272296815202, "loss": 0.0105, "step": 93080 }, { "epoch": 1.01, "learning_rate": 0.00014904650710254912, "loss": 0.0089, "step": 93090 }, { "epoch": 1.01, "learning_rate": 0.0001490302912369462, "loss": 0.009, "step": 93100 }, { "epoch": 1.01, "learning_rate": 0.0001490140753713433, "loss": 0.0112, "step": 93110 }, { "epoch": 1.01, "learning_rate": 0.00014899785950574042, "loss": 0.0105, "step": 93120 }, { "epoch": 1.01, "learning_rate": 0.0001489816436401375, "loss": 0.0104, "step": 93130 }, { "epoch": 1.01, "learning_rate": 0.0001489654277745346, "loss": 0.0111, "step": 93140 }, { "epoch": 1.01, "learning_rate": 0.00014894921190893167, "loss": 0.0151, "step": 93150 }, { "epoch": 1.01, "learning_rate": 0.0001489329960433288, "loss": 0.0088, "step": 93160 }, { "epoch": 1.01, "learning_rate": 0.00014891678017772586, "loss": 0.0101, "step": 93170 }, { "epoch": 1.01, "learning_rate": 0.00014890056431212298, "loss": 0.0126, "step": 93180 }, { "epoch": 1.01, "learning_rate": 0.00014888434844652007, "loss": 0.012, "step": 93190 }, { "epoch": 1.01, "learning_rate": 0.00014886813258091716, "loss": 0.0107, "step": 93200 }, { "epoch": 1.01, "learning_rate": 0.00014885191671531426, "loss": 0.0114, "step": 93210 }, { "epoch": 1.01, "learning_rate": 0.00014883570084971135, "loss": 0.0122, "step": 93220 }, { "epoch": 1.01, "learning_rate": 0.00014881948498410844, "loss": 0.0126, "step": 93230 }, { "epoch": 1.01, "learning_rate": 0.00014880326911850553, "loss": 0.0145, "step": 93240 }, { "epoch": 1.01, "learning_rate": 0.00014878705325290263, "loss": 0.0099, "step": 93250 }, { "epoch": 1.01, "learning_rate": 0.00014877083738729972, "loss": 0.012, "step": 93260 }, { "epoch": 1.01, "learning_rate": 0.0001487546215216968, "loss": 0.0121, "step": 93270 }, { "epoch": 1.01, "learning_rate": 0.0001487384056560939, "loss": 0.0105, "step": 93280 }, { "epoch": 1.01, "learning_rate": 0.000148722189790491, "loss": 0.0105, "step": 93290 }, { "epoch": 1.01, "learning_rate": 0.0001487059739248881, "loss": 0.0113, "step": 93300 }, { "epoch": 1.01, "learning_rate": 0.00014868975805928518, "loss": 0.0153, "step": 93310 }, { "epoch": 1.01, "learning_rate": 0.00014867354219368228, "loss": 0.0112, "step": 93320 }, { "epoch": 1.01, "learning_rate": 0.00014865732632807937, "loss": 0.012, "step": 93330 }, { "epoch": 1.01, "learning_rate": 0.0001486411104624765, "loss": 0.0118, "step": 93340 }, { "epoch": 1.01, "learning_rate": 0.00014862489459687355, "loss": 0.0097, "step": 93350 }, { "epoch": 1.01, "learning_rate": 0.00014860867873127067, "loss": 0.0081, "step": 93360 }, { "epoch": 1.01, "learning_rate": 0.00014859246286566774, "loss": 0.0126, "step": 93370 }, { "epoch": 1.01, "learning_rate": 0.00014857624700006486, "loss": 0.011, "step": 93380 }, { "epoch": 1.01, "learning_rate": 0.00014856003113446193, "loss": 0.0105, "step": 93390 }, { "epoch": 1.01, "learning_rate": 0.00014854381526885905, "loss": 0.0111, "step": 93400 }, { "epoch": 1.01, "learning_rate": 0.00014852759940325614, "loss": 0.0119, "step": 93410 }, { "epoch": 1.01, "learning_rate": 0.00014851138353765323, "loss": 0.0108, "step": 93420 }, { "epoch": 1.01, "learning_rate": 0.00014849516767205032, "loss": 0.0123, "step": 93430 }, { "epoch": 1.01, "learning_rate": 0.00014847895180644742, "loss": 0.0083, "step": 93440 }, { "epoch": 1.01, "learning_rate": 0.0001484627359408445, "loss": 0.0102, "step": 93450 }, { "epoch": 1.01, "learning_rate": 0.0001484465200752416, "loss": 0.011, "step": 93460 }, { "epoch": 1.01, "learning_rate": 0.0001484303042096387, "loss": 0.0134, "step": 93470 }, { "epoch": 1.01, "learning_rate": 0.0001484140883440358, "loss": 0.0107, "step": 93480 }, { "epoch": 1.01, "learning_rate": 0.00014839787247843288, "loss": 0.0107, "step": 93490 }, { "epoch": 1.01, "learning_rate": 0.00014838165661282997, "loss": 0.0096, "step": 93500 }, { "epoch": 1.01, "learning_rate": 0.0001483654407472271, "loss": 0.0103, "step": 93510 }, { "epoch": 1.01, "learning_rate": 0.00014834922488162416, "loss": 0.0112, "step": 93520 }, { "epoch": 1.01, "learning_rate": 0.00014833300901602128, "loss": 0.0123, "step": 93530 }, { "epoch": 1.01, "learning_rate": 0.00014831679315041834, "loss": 0.01, "step": 93540 }, { "epoch": 1.01, "learning_rate": 0.00014830057728481546, "loss": 0.0096, "step": 93550 }, { "epoch": 1.01, "learning_rate": 0.00014828436141921256, "loss": 0.0097, "step": 93560 }, { "epoch": 1.01, "learning_rate": 0.00014826814555360965, "loss": 0.0111, "step": 93570 }, { "epoch": 1.01, "learning_rate": 0.00014825192968800674, "loss": 0.0115, "step": 93580 }, { "epoch": 1.01, "learning_rate": 0.00014823571382240383, "loss": 0.0098, "step": 93590 }, { "epoch": 1.01, "learning_rate": 0.00014821949795680093, "loss": 0.0113, "step": 93600 }, { "epoch": 1.01, "learning_rate": 0.00014820328209119802, "loss": 0.0103, "step": 93610 }, { "epoch": 1.01, "learning_rate": 0.0001481870662255951, "loss": 0.0107, "step": 93620 }, { "epoch": 1.01, "learning_rate": 0.0001481708503599922, "loss": 0.0083, "step": 93630 }, { "epoch": 1.01, "learning_rate": 0.0001481546344943893, "loss": 0.0095, "step": 93640 }, { "epoch": 1.01, "learning_rate": 0.0001481384186287864, "loss": 0.0093, "step": 93650 }, { "epoch": 1.01, "learning_rate": 0.00014812220276318348, "loss": 0.013, "step": 93660 }, { "epoch": 1.01, "learning_rate": 0.00014810598689758058, "loss": 0.0111, "step": 93670 }, { "epoch": 1.01, "learning_rate": 0.00014808977103197767, "loss": 0.0135, "step": 93680 }, { "epoch": 1.01, "learning_rate": 0.00014807355516637476, "loss": 0.0126, "step": 93690 }, { "epoch": 1.01, "learning_rate": 0.00014805733930077185, "loss": 0.0109, "step": 93700 }, { "epoch": 1.01, "learning_rate": 0.00014804112343516897, "loss": 0.0116, "step": 93710 }, { "epoch": 1.01, "learning_rate": 0.00014802490756956604, "loss": 0.0118, "step": 93720 }, { "epoch": 1.01, "learning_rate": 0.00014800869170396316, "loss": 0.0125, "step": 93730 }, { "epoch": 1.01, "learning_rate": 0.00014799247583836023, "loss": 0.0118, "step": 93740 }, { "epoch": 1.01, "learning_rate": 0.00014797625997275735, "loss": 0.0098, "step": 93750 }, { "epoch": 1.01, "learning_rate": 0.0001479600441071544, "loss": 0.0117, "step": 93760 }, { "epoch": 1.01, "learning_rate": 0.00014794382824155153, "loss": 0.0128, "step": 93770 }, { "epoch": 1.01, "learning_rate": 0.00014792761237594862, "loss": 0.012, "step": 93780 }, { "epoch": 1.01, "learning_rate": 0.00014791139651034572, "loss": 0.0122, "step": 93790 }, { "epoch": 1.01, "learning_rate": 0.0001478951806447428, "loss": 0.0116, "step": 93800 }, { "epoch": 1.01, "learning_rate": 0.0001478789647791399, "loss": 0.008, "step": 93810 }, { "epoch": 1.01, "learning_rate": 0.000147862748913537, "loss": 0.0091, "step": 93820 }, { "epoch": 1.01, "learning_rate": 0.0001478465330479341, "loss": 0.0117, "step": 93830 }, { "epoch": 1.01, "learning_rate": 0.00014783031718233118, "loss": 0.0115, "step": 93840 }, { "epoch": 1.01, "learning_rate": 0.00014781410131672827, "loss": 0.0116, "step": 93850 }, { "epoch": 1.01, "learning_rate": 0.00014779788545112537, "loss": 0.0124, "step": 93860 }, { "epoch": 1.01, "learning_rate": 0.00014778166958552246, "loss": 0.009, "step": 93870 }, { "epoch": 1.01, "learning_rate": 0.00014776545371991955, "loss": 0.0137, "step": 93880 }, { "epoch": 1.01, "learning_rate": 0.00014774923785431664, "loss": 0.0111, "step": 93890 }, { "epoch": 1.02, "learning_rate": 0.00014773302198871374, "loss": 0.0104, "step": 93900 }, { "epoch": 1.02, "learning_rate": 0.00014771680612311083, "loss": 0.0119, "step": 93910 }, { "epoch": 1.02, "learning_rate": 0.00014770059025750792, "loss": 0.0091, "step": 93920 }, { "epoch": 1.02, "learning_rate": 0.00014768437439190504, "loss": 0.0101, "step": 93930 }, { "epoch": 1.02, "learning_rate": 0.0001476681585263021, "loss": 0.0132, "step": 93940 }, { "epoch": 1.02, "learning_rate": 0.00014765194266069923, "loss": 0.0124, "step": 93950 }, { "epoch": 1.02, "learning_rate": 0.0001476357267950963, "loss": 0.0109, "step": 93960 }, { "epoch": 1.02, "learning_rate": 0.0001476195109294934, "loss": 0.0103, "step": 93970 }, { "epoch": 1.02, "learning_rate": 0.00014760329506389048, "loss": 0.0131, "step": 93980 }, { "epoch": 1.02, "learning_rate": 0.0001475870791982876, "loss": 0.0135, "step": 93990 }, { "epoch": 1.02, "learning_rate": 0.0001475708633326847, "loss": 0.0103, "step": 94000 }, { "epoch": 1.02, "eval_cer": 0.9215634158332421, "eval_loss": 0.008654128760099411, "eval_runtime": 121.8962, "eval_samples_per_second": 16.407, "eval_steps_per_second": 4.102, "step": 94000 }, { "epoch": 1.02, "learning_rate": 0.00014755464746708178, "loss": 0.0152, "step": 94010 }, { "epoch": 1.02, "learning_rate": 0.00014753843160147888, "loss": 0.0115, "step": 94020 }, { "epoch": 1.02, "learning_rate": 0.00014752221573587597, "loss": 0.0104, "step": 94030 }, { "epoch": 1.02, "learning_rate": 0.00014750599987027306, "loss": 0.0096, "step": 94040 }, { "epoch": 1.02, "learning_rate": 0.00014748978400467015, "loss": 0.0104, "step": 94050 }, { "epoch": 1.02, "learning_rate": 0.00014747356813906725, "loss": 0.0124, "step": 94060 }, { "epoch": 1.02, "learning_rate": 0.00014745735227346434, "loss": 0.0106, "step": 94070 }, { "epoch": 1.02, "learning_rate": 0.00014744113640786143, "loss": 0.0132, "step": 94080 }, { "epoch": 1.02, "learning_rate": 0.00014742492054225853, "loss": 0.0097, "step": 94090 }, { "epoch": 1.02, "learning_rate": 0.00014740870467665562, "loss": 0.0093, "step": 94100 }, { "epoch": 1.02, "learning_rate": 0.0001473924888110527, "loss": 0.0092, "step": 94110 }, { "epoch": 1.02, "learning_rate": 0.0001473762729454498, "loss": 0.0118, "step": 94120 }, { "epoch": 1.02, "learning_rate": 0.0001473600570798469, "loss": 0.0118, "step": 94130 }, { "epoch": 1.02, "learning_rate": 0.000147343841214244, "loss": 0.0099, "step": 94140 }, { "epoch": 1.02, "learning_rate": 0.0001473276253486411, "loss": 0.0103, "step": 94150 }, { "epoch": 1.02, "learning_rate": 0.00014731140948303818, "loss": 0.0108, "step": 94160 }, { "epoch": 1.02, "learning_rate": 0.0001472951936174353, "loss": 0.0098, "step": 94170 }, { "epoch": 1.02, "learning_rate": 0.00014727897775183236, "loss": 0.0096, "step": 94180 }, { "epoch": 1.02, "learning_rate": 0.00014726276188622948, "loss": 0.0114, "step": 94190 }, { "epoch": 1.02, "learning_rate": 0.00014724654602062657, "loss": 0.0114, "step": 94200 }, { "epoch": 1.02, "learning_rate": 0.00014723033015502367, "loss": 0.0112, "step": 94210 }, { "epoch": 1.02, "learning_rate": 0.00014721411428942076, "loss": 0.0117, "step": 94220 }, { "epoch": 1.02, "learning_rate": 0.00014719789842381785, "loss": 0.01, "step": 94230 }, { "epoch": 1.02, "learning_rate": 0.00014718168255821494, "loss": 0.0098, "step": 94240 }, { "epoch": 1.02, "learning_rate": 0.00014716546669261204, "loss": 0.0133, "step": 94250 }, { "epoch": 1.02, "learning_rate": 0.00014714925082700913, "loss": 0.01, "step": 94260 }, { "epoch": 1.02, "learning_rate": 0.00014713303496140622, "loss": 0.0142, "step": 94270 }, { "epoch": 1.02, "learning_rate": 0.00014711681909580334, "loss": 0.0101, "step": 94280 }, { "epoch": 1.02, "learning_rate": 0.0001471006032302004, "loss": 0.0074, "step": 94290 }, { "epoch": 1.02, "learning_rate": 0.00014708438736459753, "loss": 0.0131, "step": 94300 }, { "epoch": 1.02, "learning_rate": 0.0001470681714989946, "loss": 0.0122, "step": 94310 }, { "epoch": 1.02, "learning_rate": 0.0001470519556333917, "loss": 0.0099, "step": 94320 }, { "epoch": 1.02, "learning_rate": 0.00014703573976778878, "loss": 0.0087, "step": 94330 }, { "epoch": 1.02, "learning_rate": 0.0001470195239021859, "loss": 0.0099, "step": 94340 }, { "epoch": 1.02, "learning_rate": 0.000147003308036583, "loss": 0.01, "step": 94350 }, { "epoch": 1.02, "learning_rate": 0.00014698709217098008, "loss": 0.011, "step": 94360 }, { "epoch": 1.02, "learning_rate": 0.00014697087630537718, "loss": 0.0096, "step": 94370 }, { "epoch": 1.02, "learning_rate": 0.00014695466043977427, "loss": 0.0079, "step": 94380 }, { "epoch": 1.02, "learning_rate": 0.00014693844457417136, "loss": 0.0114, "step": 94390 }, { "epoch": 1.02, "learning_rate": 0.00014692222870856846, "loss": 0.0106, "step": 94400 }, { "epoch": 1.02, "learning_rate": 0.00014690601284296555, "loss": 0.0099, "step": 94410 }, { "epoch": 1.02, "learning_rate": 0.00014688979697736264, "loss": 0.0103, "step": 94420 }, { "epoch": 1.02, "learning_rate": 0.00014687358111175973, "loss": 0.011, "step": 94430 }, { "epoch": 1.02, "learning_rate": 0.00014685736524615683, "loss": 0.0122, "step": 94440 }, { "epoch": 1.02, "learning_rate": 0.00014684114938055392, "loss": 0.011, "step": 94450 }, { "epoch": 1.02, "learning_rate": 0.000146824933514951, "loss": 0.0112, "step": 94460 }, { "epoch": 1.02, "learning_rate": 0.0001468087176493481, "loss": 0.0094, "step": 94470 }, { "epoch": 1.02, "learning_rate": 0.0001467925017837452, "loss": 0.0108, "step": 94480 }, { "epoch": 1.02, "learning_rate": 0.0001467762859181423, "loss": 0.01, "step": 94490 }, { "epoch": 1.02, "learning_rate": 0.0001467600700525394, "loss": 0.0122, "step": 94500 }, { "epoch": 1.02, "learning_rate": 0.00014674385418693648, "loss": 0.0113, "step": 94510 }, { "epoch": 1.02, "learning_rate": 0.0001467276383213336, "loss": 0.0098, "step": 94520 }, { "epoch": 1.02, "learning_rate": 0.00014671142245573066, "loss": 0.012, "step": 94530 }, { "epoch": 1.02, "learning_rate": 0.00014669520659012778, "loss": 0.0101, "step": 94540 }, { "epoch": 1.02, "learning_rate": 0.00014667899072452485, "loss": 0.0111, "step": 94550 }, { "epoch": 1.02, "learning_rate": 0.00014666277485892197, "loss": 0.0115, "step": 94560 }, { "epoch": 1.02, "learning_rate": 0.00014664655899331906, "loss": 0.0095, "step": 94570 }, { "epoch": 1.02, "learning_rate": 0.00014663034312771615, "loss": 0.0134, "step": 94580 }, { "epoch": 1.02, "learning_rate": 0.00014661412726211324, "loss": 0.0109, "step": 94590 }, { "epoch": 1.02, "learning_rate": 0.00014659791139651034, "loss": 0.0126, "step": 94600 }, { "epoch": 1.02, "learning_rate": 0.00014658169553090743, "loss": 0.0104, "step": 94610 }, { "epoch": 1.02, "learning_rate": 0.00014656547966530452, "loss": 0.0103, "step": 94620 }, { "epoch": 1.02, "learning_rate": 0.00014654926379970162, "loss": 0.0097, "step": 94630 }, { "epoch": 1.02, "learning_rate": 0.0001465330479340987, "loss": 0.0119, "step": 94640 }, { "epoch": 1.02, "learning_rate": 0.0001465168320684958, "loss": 0.01, "step": 94650 }, { "epoch": 1.02, "learning_rate": 0.0001465006162028929, "loss": 0.0107, "step": 94660 }, { "epoch": 1.02, "learning_rate": 0.00014648440033728999, "loss": 0.0104, "step": 94670 }, { "epoch": 1.02, "learning_rate": 0.00014646818447168708, "loss": 0.0106, "step": 94680 }, { "epoch": 1.02, "learning_rate": 0.00014645196860608417, "loss": 0.0114, "step": 94690 }, { "epoch": 1.02, "learning_rate": 0.00014643575274048126, "loss": 0.0118, "step": 94700 }, { "epoch": 1.02, "learning_rate": 0.00014641953687487836, "loss": 0.0104, "step": 94710 }, { "epoch": 1.02, "learning_rate": 0.00014640332100927548, "loss": 0.0117, "step": 94720 }, { "epoch": 1.02, "learning_rate": 0.00014638710514367254, "loss": 0.0092, "step": 94730 }, { "epoch": 1.02, "learning_rate": 0.00014637088927806966, "loss": 0.0144, "step": 94740 }, { "epoch": 1.02, "learning_rate": 0.00014635467341246673, "loss": 0.0113, "step": 94750 }, { "epoch": 1.02, "learning_rate": 0.00014633845754686385, "loss": 0.0109, "step": 94760 }, { "epoch": 1.02, "learning_rate": 0.00014632224168126091, "loss": 0.0105, "step": 94770 }, { "epoch": 1.02, "learning_rate": 0.00014630602581565803, "loss": 0.011, "step": 94780 }, { "epoch": 1.02, "learning_rate": 0.00014628980995005513, "loss": 0.0152, "step": 94790 }, { "epoch": 1.02, "learning_rate": 0.00014627359408445222, "loss": 0.01, "step": 94800 }, { "epoch": 1.02, "learning_rate": 0.0001462573782188493, "loss": 0.0111, "step": 94810 }, { "epoch": 1.03, "learning_rate": 0.0001462411623532464, "loss": 0.0106, "step": 94820 }, { "epoch": 1.03, "learning_rate": 0.0001462249464876435, "loss": 0.0102, "step": 94830 }, { "epoch": 1.03, "learning_rate": 0.0001462087306220406, "loss": 0.0107, "step": 94840 }, { "epoch": 1.03, "learning_rate": 0.00014619251475643768, "loss": 0.0127, "step": 94850 }, { "epoch": 1.03, "learning_rate": 0.00014617629889083478, "loss": 0.0117, "step": 94860 }, { "epoch": 1.03, "learning_rate": 0.00014616008302523187, "loss": 0.0098, "step": 94870 }, { "epoch": 1.03, "learning_rate": 0.00014614386715962896, "loss": 0.0114, "step": 94880 }, { "epoch": 1.03, "learning_rate": 0.00014612765129402605, "loss": 0.0108, "step": 94890 }, { "epoch": 1.03, "learning_rate": 0.00014611143542842315, "loss": 0.0119, "step": 94900 }, { "epoch": 1.03, "learning_rate": 0.00014609521956282024, "loss": 0.0095, "step": 94910 }, { "epoch": 1.03, "learning_rate": 0.00014607900369721733, "loss": 0.0103, "step": 94920 }, { "epoch": 1.03, "learning_rate": 0.00014606278783161442, "loss": 0.0123, "step": 94930 }, { "epoch": 1.03, "learning_rate": 0.00014604657196601154, "loss": 0.0107, "step": 94940 }, { "epoch": 1.03, "learning_rate": 0.00014603035610040864, "loss": 0.0134, "step": 94950 }, { "epoch": 1.03, "learning_rate": 0.00014601414023480573, "loss": 0.0105, "step": 94960 }, { "epoch": 1.03, "learning_rate": 0.00014599792436920282, "loss": 0.0105, "step": 94970 }, { "epoch": 1.03, "learning_rate": 0.00014598170850359992, "loss": 0.0093, "step": 94980 }, { "epoch": 1.03, "learning_rate": 0.000145965492637997, "loss": 0.0096, "step": 94990 }, { "epoch": 1.03, "learning_rate": 0.0001459492767723941, "loss": 0.0103, "step": 95000 }, { "epoch": 1.03, "eval_cer": 0.9215477809800273, "eval_loss": 0.009139502421021461, "eval_runtime": 121.5893, "eval_samples_per_second": 16.449, "eval_steps_per_second": 4.112, "step": 95000 }, { "epoch": 1.03, "learning_rate": 0.0001459330609067912, "loss": 0.01, "step": 95010 }, { "epoch": 1.03, "learning_rate": 0.0001459168450411883, "loss": 0.011, "step": 95020 }, { "epoch": 1.03, "learning_rate": 0.00014590062917558538, "loss": 0.0115, "step": 95030 }, { "epoch": 1.03, "learning_rate": 0.00014588441330998247, "loss": 0.0113, "step": 95040 }, { "epoch": 1.03, "learning_rate": 0.00014586819744437956, "loss": 0.012, "step": 95050 }, { "epoch": 1.03, "learning_rate": 0.00014585198157877666, "loss": 0.0116, "step": 95060 }, { "epoch": 1.03, "learning_rate": 0.00014583576571317375, "loss": 0.0096, "step": 95070 }, { "epoch": 1.03, "learning_rate": 0.00014581954984757084, "loss": 0.0095, "step": 95080 }, { "epoch": 1.03, "learning_rate": 0.00014580333398196796, "loss": 0.0094, "step": 95090 }, { "epoch": 1.03, "learning_rate": 0.00014578711811636503, "loss": 0.0111, "step": 95100 }, { "epoch": 1.03, "learning_rate": 0.00014577090225076215, "loss": 0.0114, "step": 95110 }, { "epoch": 1.03, "learning_rate": 0.00014575468638515921, "loss": 0.0097, "step": 95120 }, { "epoch": 1.03, "learning_rate": 0.00014573847051955633, "loss": 0.0115, "step": 95130 }, { "epoch": 1.03, "learning_rate": 0.0001457222546539534, "loss": 0.0114, "step": 95140 }, { "epoch": 1.03, "learning_rate": 0.00014570603878835052, "loss": 0.0136, "step": 95150 }, { "epoch": 1.03, "learning_rate": 0.0001456898229227476, "loss": 0.0105, "step": 95160 }, { "epoch": 1.03, "learning_rate": 0.0001456736070571447, "loss": 0.0092, "step": 95170 }, { "epoch": 1.03, "learning_rate": 0.0001456573911915418, "loss": 0.0091, "step": 95180 }, { "epoch": 1.03, "learning_rate": 0.0001456411753259389, "loss": 0.01, "step": 95190 }, { "epoch": 1.03, "learning_rate": 0.00014562495946033598, "loss": 0.0135, "step": 95200 }, { "epoch": 1.03, "learning_rate": 0.00014560874359473308, "loss": 0.013, "step": 95210 }, { "epoch": 1.03, "learning_rate": 0.00014559252772913017, "loss": 0.0127, "step": 95220 }, { "epoch": 1.03, "learning_rate": 0.00014557631186352726, "loss": 0.0115, "step": 95230 }, { "epoch": 1.03, "learning_rate": 0.00014556009599792435, "loss": 0.0119, "step": 95240 }, { "epoch": 1.03, "learning_rate": 0.00014554388013232145, "loss": 0.0115, "step": 95250 }, { "epoch": 1.03, "learning_rate": 0.00014552766426671854, "loss": 0.0102, "step": 95260 }, { "epoch": 1.03, "learning_rate": 0.00014551144840111563, "loss": 0.0123, "step": 95270 }, { "epoch": 1.03, "learning_rate": 0.00014549523253551273, "loss": 0.0125, "step": 95280 }, { "epoch": 1.03, "learning_rate": 0.00014547901666990984, "loss": 0.0105, "step": 95290 }, { "epoch": 1.03, "learning_rate": 0.0001454628008043069, "loss": 0.0116, "step": 95300 }, { "epoch": 1.03, "learning_rate": 0.00014544658493870403, "loss": 0.011, "step": 95310 }, { "epoch": 1.03, "learning_rate": 0.0001454303690731011, "loss": 0.0101, "step": 95320 }, { "epoch": 1.03, "learning_rate": 0.00014541415320749822, "loss": 0.0089, "step": 95330 }, { "epoch": 1.03, "learning_rate": 0.00014539793734189528, "loss": 0.0113, "step": 95340 }, { "epoch": 1.03, "learning_rate": 0.0001453817214762924, "loss": 0.0105, "step": 95350 }, { "epoch": 1.03, "learning_rate": 0.0001453655056106895, "loss": 0.0103, "step": 95360 }, { "epoch": 1.03, "learning_rate": 0.0001453492897450866, "loss": 0.0084, "step": 95370 }, { "epoch": 1.03, "learning_rate": 0.00014533307387948368, "loss": 0.0129, "step": 95380 }, { "epoch": 1.03, "learning_rate": 0.00014531685801388077, "loss": 0.0113, "step": 95390 }, { "epoch": 1.03, "learning_rate": 0.00014530064214827787, "loss": 0.0099, "step": 95400 }, { "epoch": 1.03, "learning_rate": 0.00014528442628267496, "loss": 0.013, "step": 95410 }, { "epoch": 1.03, "learning_rate": 0.00014526821041707205, "loss": 0.0091, "step": 95420 }, { "epoch": 1.03, "learning_rate": 0.00014525199455146914, "loss": 0.0105, "step": 95430 }, { "epoch": 1.03, "learning_rate": 0.00014523577868586624, "loss": 0.0111, "step": 95440 }, { "epoch": 1.03, "learning_rate": 0.00014521956282026333, "loss": 0.0098, "step": 95450 }, { "epoch": 1.03, "learning_rate": 0.00014520334695466042, "loss": 0.01, "step": 95460 }, { "epoch": 1.03, "learning_rate": 0.00014518713108905751, "loss": 0.0103, "step": 95470 }, { "epoch": 1.03, "learning_rate": 0.0001451709152234546, "loss": 0.0117, "step": 95480 }, { "epoch": 1.03, "learning_rate": 0.0001451546993578517, "loss": 0.0102, "step": 95490 }, { "epoch": 1.03, "learning_rate": 0.0001451384834922488, "loss": 0.0081, "step": 95500 }, { "epoch": 1.03, "learning_rate": 0.0001451222676266459, "loss": 0.0125, "step": 95510 }, { "epoch": 1.03, "learning_rate": 0.00014510605176104298, "loss": 0.0097, "step": 95520 }, { "epoch": 1.03, "learning_rate": 0.0001450898358954401, "loss": 0.0109, "step": 95530 }, { "epoch": 1.03, "learning_rate": 0.00014507362002983716, "loss": 0.0114, "step": 95540 }, { "epoch": 1.03, "learning_rate": 0.00014505740416423428, "loss": 0.0108, "step": 95550 }, { "epoch": 1.03, "learning_rate": 0.00014504118829863135, "loss": 0.0112, "step": 95560 }, { "epoch": 1.03, "learning_rate": 0.00014502497243302847, "loss": 0.0096, "step": 95570 }, { "epoch": 1.03, "learning_rate": 0.00014500875656742556, "loss": 0.0108, "step": 95580 }, { "epoch": 1.03, "learning_rate": 0.00014499254070182265, "loss": 0.0123, "step": 95590 }, { "epoch": 1.03, "learning_rate": 0.00014497632483621975, "loss": 0.0084, "step": 95600 }, { "epoch": 1.03, "learning_rate": 0.00014496010897061684, "loss": 0.0124, "step": 95610 }, { "epoch": 1.03, "learning_rate": 0.00014494389310501393, "loss": 0.0104, "step": 95620 }, { "epoch": 1.03, "learning_rate": 0.00014492767723941103, "loss": 0.0116, "step": 95630 }, { "epoch": 1.03, "learning_rate": 0.00014491146137380812, "loss": 0.012, "step": 95640 }, { "epoch": 1.03, "learning_rate": 0.0001448952455082052, "loss": 0.0108, "step": 95650 }, { "epoch": 1.03, "learning_rate": 0.0001448790296426023, "loss": 0.0128, "step": 95660 }, { "epoch": 1.03, "learning_rate": 0.0001448628137769994, "loss": 0.0146, "step": 95670 }, { "epoch": 1.03, "learning_rate": 0.00014484659791139652, "loss": 0.012, "step": 95680 }, { "epoch": 1.03, "learning_rate": 0.00014483038204579358, "loss": 0.0081, "step": 95690 }, { "epoch": 1.03, "learning_rate": 0.0001448141661801907, "loss": 0.0081, "step": 95700 }, { "epoch": 1.03, "learning_rate": 0.00014479795031458777, "loss": 0.0096, "step": 95710 }, { "epoch": 1.03, "learning_rate": 0.0001447817344489849, "loss": 0.0102, "step": 95720 }, { "epoch": 1.03, "learning_rate": 0.00014476551858338198, "loss": 0.0097, "step": 95730 }, { "epoch": 1.03, "learning_rate": 0.00014474930271777907, "loss": 0.01, "step": 95740 }, { "epoch": 1.04, "learning_rate": 0.00014473308685217617, "loss": 0.0086, "step": 95750 }, { "epoch": 1.04, "learning_rate": 0.00014471687098657326, "loss": 0.0096, "step": 95760 }, { "epoch": 1.04, "learning_rate": 0.00014470065512097035, "loss": 0.0103, "step": 95770 }, { "epoch": 1.04, "learning_rate": 0.00014468443925536744, "loss": 0.0092, "step": 95780 }, { "epoch": 1.04, "learning_rate": 0.00014466822338976454, "loss": 0.0102, "step": 95790 }, { "epoch": 1.04, "learning_rate": 0.00014465200752416163, "loss": 0.0111, "step": 95800 }, { "epoch": 1.04, "learning_rate": 0.00014463579165855872, "loss": 0.0139, "step": 95810 }, { "epoch": 1.04, "learning_rate": 0.00014461957579295581, "loss": 0.0103, "step": 95820 }, { "epoch": 1.04, "learning_rate": 0.0001446033599273529, "loss": 0.0115, "step": 95830 }, { "epoch": 1.04, "learning_rate": 0.00014458714406175, "loss": 0.0089, "step": 95840 }, { "epoch": 1.04, "learning_rate": 0.0001445709281961471, "loss": 0.0104, "step": 95850 }, { "epoch": 1.04, "learning_rate": 0.00014455471233054419, "loss": 0.0112, "step": 95860 }, { "epoch": 1.04, "learning_rate": 0.00014453849646494128, "loss": 0.007, "step": 95870 }, { "epoch": 1.04, "learning_rate": 0.0001445222805993384, "loss": 0.0119, "step": 95880 }, { "epoch": 1.04, "learning_rate": 0.00014450606473373546, "loss": 0.0101, "step": 95890 }, { "epoch": 1.04, "learning_rate": 0.00014448984886813258, "loss": 0.0113, "step": 95900 }, { "epoch": 1.04, "learning_rate": 0.00014447363300252965, "loss": 0.015, "step": 95910 }, { "epoch": 1.04, "learning_rate": 0.00014445741713692677, "loss": 0.014, "step": 95920 }, { "epoch": 1.04, "learning_rate": 0.00014444120127132383, "loss": 0.0115, "step": 95930 }, { "epoch": 1.04, "learning_rate": 0.00014442498540572095, "loss": 0.0098, "step": 95940 }, { "epoch": 1.04, "learning_rate": 0.00014440876954011805, "loss": 0.0112, "step": 95950 }, { "epoch": 1.04, "learning_rate": 0.00014439255367451514, "loss": 0.0104, "step": 95960 }, { "epoch": 1.04, "learning_rate": 0.00014437633780891223, "loss": 0.0122, "step": 95970 }, { "epoch": 1.04, "learning_rate": 0.00014436012194330933, "loss": 0.0097, "step": 95980 }, { "epoch": 1.04, "learning_rate": 0.00014434390607770642, "loss": 0.0094, "step": 95990 }, { "epoch": 1.04, "learning_rate": 0.0001443276902121035, "loss": 0.0107, "step": 96000 }, { "epoch": 1.04, "eval_cer": 0.9215503867888964, "eval_loss": 0.008839464746415615, "eval_runtime": 121.6744, "eval_samples_per_second": 16.437, "eval_steps_per_second": 4.109, "step": 96000 }, { "epoch": 1.04, "learning_rate": 0.0001443114743465006, "loss": 0.0106, "step": 96010 }, { "epoch": 1.04, "learning_rate": 0.0001442952584808977, "loss": 0.0109, "step": 96020 }, { "epoch": 1.04, "learning_rate": 0.0001442790426152948, "loss": 0.0094, "step": 96030 }, { "epoch": 1.04, "learning_rate": 0.00014426282674969188, "loss": 0.0114, "step": 96040 }, { "epoch": 1.04, "learning_rate": 0.00014424661088408897, "loss": 0.0102, "step": 96050 }, { "epoch": 1.04, "learning_rate": 0.00014423039501848607, "loss": 0.0106, "step": 96060 }, { "epoch": 1.04, "learning_rate": 0.00014421417915288316, "loss": 0.0083, "step": 96070 }, { "epoch": 1.04, "learning_rate": 0.00014419796328728025, "loss": 0.0118, "step": 96080 }, { "epoch": 1.04, "learning_rate": 0.00014418174742167735, "loss": 0.0098, "step": 96090 }, { "epoch": 1.04, "learning_rate": 0.00014416553155607447, "loss": 0.0147, "step": 96100 }, { "epoch": 1.04, "learning_rate": 0.00014414931569047153, "loss": 0.0123, "step": 96110 }, { "epoch": 1.04, "learning_rate": 0.00014413309982486865, "loss": 0.0113, "step": 96120 }, { "epoch": 1.04, "learning_rate": 0.00014411688395926572, "loss": 0.0105, "step": 96130 }, { "epoch": 1.04, "learning_rate": 0.00014410066809366284, "loss": 0.0119, "step": 96140 }, { "epoch": 1.04, "learning_rate": 0.0001440844522280599, "loss": 0.0094, "step": 96150 }, { "epoch": 1.04, "learning_rate": 0.00014406823636245702, "loss": 0.0127, "step": 96160 }, { "epoch": 1.04, "learning_rate": 0.00014405202049685411, "loss": 0.0104, "step": 96170 }, { "epoch": 1.04, "learning_rate": 0.0001440358046312512, "loss": 0.0095, "step": 96180 }, { "epoch": 1.04, "learning_rate": 0.0001440195887656483, "loss": 0.0082, "step": 96190 }, { "epoch": 1.04, "learning_rate": 0.0001440033729000454, "loss": 0.0129, "step": 96200 }, { "epoch": 1.04, "learning_rate": 0.00014398715703444249, "loss": 0.0105, "step": 96210 }, { "epoch": 1.04, "learning_rate": 0.00014397094116883958, "loss": 0.0094, "step": 96220 }, { "epoch": 1.04, "learning_rate": 0.00014395472530323667, "loss": 0.0094, "step": 96230 }, { "epoch": 1.04, "learning_rate": 0.00014393850943763376, "loss": 0.0132, "step": 96240 }, { "epoch": 1.04, "learning_rate": 0.00014392229357203086, "loss": 0.0114, "step": 96250 }, { "epoch": 1.04, "learning_rate": 0.00014390607770642795, "loss": 0.0138, "step": 96260 }, { "epoch": 1.04, "learning_rate": 0.00014388986184082504, "loss": 0.0117, "step": 96270 }, { "epoch": 1.04, "learning_rate": 0.00014387364597522213, "loss": 0.0126, "step": 96280 }, { "epoch": 1.04, "learning_rate": 0.00014385743010961923, "loss": 0.0106, "step": 96290 }, { "epoch": 1.04, "learning_rate": 0.00014384121424401635, "loss": 0.0116, "step": 96300 }, { "epoch": 1.04, "learning_rate": 0.0001438249983784134, "loss": 0.0116, "step": 96310 }, { "epoch": 1.04, "learning_rate": 0.00014380878251281053, "loss": 0.0108, "step": 96320 }, { "epoch": 1.04, "learning_rate": 0.0001437925666472076, "loss": 0.0092, "step": 96330 }, { "epoch": 1.04, "learning_rate": 0.00014377635078160472, "loss": 0.0122, "step": 96340 }, { "epoch": 1.04, "learning_rate": 0.00014376013491600178, "loss": 0.0089, "step": 96350 }, { "epoch": 1.04, "learning_rate": 0.0001437439190503989, "loss": 0.0114, "step": 96360 }, { "epoch": 1.04, "learning_rate": 0.000143727703184796, "loss": 0.0124, "step": 96370 }, { "epoch": 1.04, "learning_rate": 0.0001437114873191931, "loss": 0.013, "step": 96380 }, { "epoch": 1.04, "learning_rate": 0.00014369527145359018, "loss": 0.0108, "step": 96390 }, { "epoch": 1.04, "learning_rate": 0.00014367905558798727, "loss": 0.0126, "step": 96400 }, { "epoch": 1.04, "learning_rate": 0.00014366283972238437, "loss": 0.0121, "step": 96410 }, { "epoch": 1.04, "learning_rate": 0.00014364662385678146, "loss": 0.0118, "step": 96420 }, { "epoch": 1.04, "learning_rate": 0.00014363040799117855, "loss": 0.0091, "step": 96430 }, { "epoch": 1.04, "learning_rate": 0.00014361419212557565, "loss": 0.011, "step": 96440 }, { "epoch": 1.04, "learning_rate": 0.00014359797625997277, "loss": 0.0111, "step": 96450 }, { "epoch": 1.04, "learning_rate": 0.00014358176039436983, "loss": 0.0097, "step": 96460 }, { "epoch": 1.04, "learning_rate": 0.00014356554452876695, "loss": 0.0101, "step": 96470 }, { "epoch": 1.04, "learning_rate": 0.00014354932866316402, "loss": 0.0113, "step": 96480 }, { "epoch": 1.04, "learning_rate": 0.00014353311279756114, "loss": 0.0098, "step": 96490 }, { "epoch": 1.04, "learning_rate": 0.0001435168969319582, "loss": 0.011, "step": 96500 }, { "epoch": 1.04, "learning_rate": 0.00014350068106635532, "loss": 0.0106, "step": 96510 }, { "epoch": 1.04, "learning_rate": 0.00014348446520075241, "loss": 0.0104, "step": 96520 }, { "epoch": 1.04, "learning_rate": 0.0001434682493351495, "loss": 0.01, "step": 96530 }, { "epoch": 1.04, "learning_rate": 0.0001434520334695466, "loss": 0.0111, "step": 96540 }, { "epoch": 1.04, "learning_rate": 0.0001434358176039437, "loss": 0.0133, "step": 96550 }, { "epoch": 1.04, "learning_rate": 0.00014341960173834079, "loss": 0.0093, "step": 96560 }, { "epoch": 1.04, "learning_rate": 0.00014340338587273788, "loss": 0.0114, "step": 96570 }, { "epoch": 1.04, "learning_rate": 0.00014338717000713497, "loss": 0.0107, "step": 96580 }, { "epoch": 1.04, "learning_rate": 0.00014337095414153206, "loss": 0.0107, "step": 96590 }, { "epoch": 1.04, "learning_rate": 0.00014335473827592916, "loss": 0.0092, "step": 96600 }, { "epoch": 1.04, "learning_rate": 0.00014333852241032625, "loss": 0.0095, "step": 96610 }, { "epoch": 1.04, "learning_rate": 0.00014332230654472334, "loss": 0.012, "step": 96620 }, { "epoch": 1.04, "learning_rate": 0.00014330609067912044, "loss": 0.0142, "step": 96630 }, { "epoch": 1.04, "learning_rate": 0.00014328987481351753, "loss": 0.0132, "step": 96640 }, { "epoch": 1.04, "learning_rate": 0.00014327365894791462, "loss": 0.0085, "step": 96650 }, { "epoch": 1.04, "learning_rate": 0.0001432574430823117, "loss": 0.0098, "step": 96660 }, { "epoch": 1.05, "learning_rate": 0.00014324122721670883, "loss": 0.0111, "step": 96670 }, { "epoch": 1.05, "learning_rate": 0.0001432250113511059, "loss": 0.0121, "step": 96680 }, { "epoch": 1.05, "learning_rate": 0.00014320879548550302, "loss": 0.0092, "step": 96690 }, { "epoch": 1.05, "learning_rate": 0.00014319257961990008, "loss": 0.0096, "step": 96700 }, { "epoch": 1.05, "learning_rate": 0.0001431763637542972, "loss": 0.0095, "step": 96710 }, { "epoch": 1.05, "learning_rate": 0.00014316014788869427, "loss": 0.0083, "step": 96720 }, { "epoch": 1.05, "learning_rate": 0.0001431439320230914, "loss": 0.0092, "step": 96730 }, { "epoch": 1.05, "learning_rate": 0.00014312771615748848, "loss": 0.0107, "step": 96740 }, { "epoch": 1.05, "learning_rate": 0.00014311150029188558, "loss": 0.0108, "step": 96750 }, { "epoch": 1.05, "learning_rate": 0.00014309528442628267, "loss": 0.0091, "step": 96760 }, { "epoch": 1.05, "learning_rate": 0.00014307906856067976, "loss": 0.0105, "step": 96770 }, { "epoch": 1.05, "learning_rate": 0.00014306285269507685, "loss": 0.0118, "step": 96780 }, { "epoch": 1.05, "learning_rate": 0.00014304663682947395, "loss": 0.0094, "step": 96790 }, { "epoch": 1.05, "learning_rate": 0.00014303042096387104, "loss": 0.0087, "step": 96800 }, { "epoch": 1.05, "learning_rate": 0.00014301420509826813, "loss": 0.0101, "step": 96810 }, { "epoch": 1.05, "learning_rate": 0.00014299798923266522, "loss": 0.0107, "step": 96820 }, { "epoch": 1.05, "learning_rate": 0.00014298177336706232, "loss": 0.0109, "step": 96830 }, { "epoch": 1.05, "learning_rate": 0.0001429655575014594, "loss": 0.0134, "step": 96840 }, { "epoch": 1.05, "learning_rate": 0.0001429493416358565, "loss": 0.0107, "step": 96850 }, { "epoch": 1.05, "learning_rate": 0.0001429331257702536, "loss": 0.0115, "step": 96860 }, { "epoch": 1.05, "learning_rate": 0.0001429169099046507, "loss": 0.0131, "step": 96870 }, { "epoch": 1.05, "learning_rate": 0.00014290069403904778, "loss": 0.0098, "step": 96880 }, { "epoch": 1.05, "learning_rate": 0.0001428844781734449, "loss": 0.0078, "step": 96890 }, { "epoch": 1.05, "learning_rate": 0.00014286826230784197, "loss": 0.0108, "step": 96900 }, { "epoch": 1.05, "learning_rate": 0.00014285204644223909, "loss": 0.0086, "step": 96910 }, { "epoch": 1.05, "learning_rate": 0.00014283583057663615, "loss": 0.0105, "step": 96920 }, { "epoch": 1.05, "learning_rate": 0.00014281961471103327, "loss": 0.0126, "step": 96930 }, { "epoch": 1.05, "learning_rate": 0.00014280339884543034, "loss": 0.0113, "step": 96940 }, { "epoch": 1.05, "learning_rate": 0.00014278718297982746, "loss": 0.011, "step": 96950 }, { "epoch": 1.05, "learning_rate": 0.00014277096711422455, "loss": 0.0111, "step": 96960 }, { "epoch": 1.05, "learning_rate": 0.00014275475124862164, "loss": 0.0101, "step": 96970 }, { "epoch": 1.05, "learning_rate": 0.00014273853538301874, "loss": 0.0104, "step": 96980 }, { "epoch": 1.05, "learning_rate": 0.00014272231951741583, "loss": 0.0096, "step": 96990 }, { "epoch": 1.05, "learning_rate": 0.00014270610365181292, "loss": 0.0109, "step": 97000 }, { "epoch": 1.05, "eval_cer": 0.9215321461268126, "eval_loss": 0.008719232864677906, "eval_runtime": 121.1881, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 97000 }, { "epoch": 1.05, "learning_rate": 0.00014268988778621001, "loss": 0.0101, "step": 97010 }, { "epoch": 1.05, "learning_rate": 0.0001426736719206071, "loss": 0.0122, "step": 97020 }, { "epoch": 1.05, "learning_rate": 0.0001426574560550042, "loss": 0.0153, "step": 97030 }, { "epoch": 1.05, "learning_rate": 0.0001426412401894013, "loss": 0.0102, "step": 97040 }, { "epoch": 1.05, "learning_rate": 0.00014262502432379838, "loss": 0.0113, "step": 97050 }, { "epoch": 1.05, "learning_rate": 0.00014260880845819548, "loss": 0.0101, "step": 97060 }, { "epoch": 1.05, "learning_rate": 0.00014259259259259257, "loss": 0.0114, "step": 97070 }, { "epoch": 1.05, "learning_rate": 0.00014257637672698966, "loss": 0.0105, "step": 97080 }, { "epoch": 1.05, "learning_rate": 0.00014256016086138676, "loss": 0.0097, "step": 97090 }, { "epoch": 1.05, "learning_rate": 0.00014254394499578385, "loss": 0.0104, "step": 97100 }, { "epoch": 1.05, "learning_rate": 0.00014252772913018097, "loss": 0.009, "step": 97110 }, { "epoch": 1.05, "learning_rate": 0.00014251151326457806, "loss": 0.0111, "step": 97120 }, { "epoch": 1.05, "learning_rate": 0.00014249529739897515, "loss": 0.0093, "step": 97130 }, { "epoch": 1.05, "learning_rate": 0.00014247908153337225, "loss": 0.0098, "step": 97140 }, { "epoch": 1.05, "learning_rate": 0.00014246286566776934, "loss": 0.0151, "step": 97150 }, { "epoch": 1.05, "learning_rate": 0.00014244664980216643, "loss": 0.0103, "step": 97160 }, { "epoch": 1.05, "learning_rate": 0.00014243043393656352, "loss": 0.0143, "step": 97170 }, { "epoch": 1.05, "learning_rate": 0.00014241421807096062, "loss": 0.0144, "step": 97180 }, { "epoch": 1.05, "learning_rate": 0.0001423980022053577, "loss": 0.0107, "step": 97190 }, { "epoch": 1.05, "learning_rate": 0.0001423817863397548, "loss": 0.0094, "step": 97200 }, { "epoch": 1.05, "learning_rate": 0.0001423655704741519, "loss": 0.0106, "step": 97210 }, { "epoch": 1.05, "learning_rate": 0.000142349354608549, "loss": 0.0096, "step": 97220 }, { "epoch": 1.05, "learning_rate": 0.00014233313874294608, "loss": 0.0102, "step": 97230 }, { "epoch": 1.05, "learning_rate": 0.00014231692287734317, "loss": 0.0088, "step": 97240 }, { "epoch": 1.05, "learning_rate": 0.00014230070701174027, "loss": 0.0124, "step": 97250 }, { "epoch": 1.05, "learning_rate": 0.00014228449114613739, "loss": 0.0111, "step": 97260 }, { "epoch": 1.05, "learning_rate": 0.00014226827528053445, "loss": 0.0115, "step": 97270 }, { "epoch": 1.05, "learning_rate": 0.00014225205941493157, "loss": 0.0088, "step": 97280 }, { "epoch": 1.05, "learning_rate": 0.00014223584354932864, "loss": 0.0134, "step": 97290 }, { "epoch": 1.05, "learning_rate": 0.00014221962768372576, "loss": 0.0114, "step": 97300 }, { "epoch": 1.05, "learning_rate": 0.00014220341181812285, "loss": 0.0101, "step": 97310 }, { "epoch": 1.05, "learning_rate": 0.00014218719595251994, "loss": 0.0118, "step": 97320 }, { "epoch": 1.05, "learning_rate": 0.00014217098008691704, "loss": 0.0096, "step": 97330 }, { "epoch": 1.05, "learning_rate": 0.00014215476422131413, "loss": 0.0082, "step": 97340 }, { "epoch": 1.05, "learning_rate": 0.00014213854835571122, "loss": 0.0101, "step": 97350 }, { "epoch": 1.05, "learning_rate": 0.00014212233249010831, "loss": 0.01, "step": 97360 }, { "epoch": 1.05, "learning_rate": 0.0001421061166245054, "loss": 0.0095, "step": 97370 }, { "epoch": 1.05, "learning_rate": 0.0001420899007589025, "loss": 0.01, "step": 97380 }, { "epoch": 1.05, "learning_rate": 0.0001420736848932996, "loss": 0.0118, "step": 97390 }, { "epoch": 1.05, "learning_rate": 0.00014205746902769668, "loss": 0.0092, "step": 97400 }, { "epoch": 1.05, "learning_rate": 0.00014204125316209378, "loss": 0.0089, "step": 97410 }, { "epoch": 1.05, "learning_rate": 0.00014202503729649087, "loss": 0.0125, "step": 97420 }, { "epoch": 1.05, "learning_rate": 0.00014200882143088796, "loss": 0.0132, "step": 97430 }, { "epoch": 1.05, "learning_rate": 0.00014199260556528506, "loss": 0.0132, "step": 97440 }, { "epoch": 1.05, "learning_rate": 0.00014197638969968215, "loss": 0.0127, "step": 97450 }, { "epoch": 1.05, "learning_rate": 0.00014196017383407927, "loss": 0.0116, "step": 97460 }, { "epoch": 1.05, "learning_rate": 0.00014194395796847633, "loss": 0.0108, "step": 97470 }, { "epoch": 1.05, "learning_rate": 0.00014192774210287345, "loss": 0.0107, "step": 97480 }, { "epoch": 1.05, "learning_rate": 0.00014191152623727052, "loss": 0.0098, "step": 97490 }, { "epoch": 1.05, "learning_rate": 0.00014189531037166764, "loss": 0.0101, "step": 97500 }, { "epoch": 1.05, "learning_rate": 0.0001418790945060647, "loss": 0.0107, "step": 97510 }, { "epoch": 1.05, "learning_rate": 0.00014186287864046182, "loss": 0.011, "step": 97520 }, { "epoch": 1.05, "learning_rate": 0.00014184666277485892, "loss": 0.0108, "step": 97530 }, { "epoch": 1.05, "learning_rate": 0.000141830446909256, "loss": 0.0118, "step": 97540 }, { "epoch": 1.05, "learning_rate": 0.0001418142310436531, "loss": 0.0111, "step": 97550 }, { "epoch": 1.05, "learning_rate": 0.0001417980151780502, "loss": 0.0091, "step": 97560 }, { "epoch": 1.05, "learning_rate": 0.0001417817993124473, "loss": 0.0097, "step": 97570 }, { "epoch": 1.05, "learning_rate": 0.00014176558344684438, "loss": 0.0102, "step": 97580 }, { "epoch": 1.05, "learning_rate": 0.00014174936758124147, "loss": 0.0107, "step": 97590 }, { "epoch": 1.06, "learning_rate": 0.00014173315171563857, "loss": 0.0112, "step": 97600 }, { "epoch": 1.06, "learning_rate": 0.00014171693585003566, "loss": 0.0116, "step": 97610 }, { "epoch": 1.06, "learning_rate": 0.00014170071998443275, "loss": 0.0098, "step": 97620 }, { "epoch": 1.06, "learning_rate": 0.00014168450411882985, "loss": 0.0082, "step": 97630 }, { "epoch": 1.06, "learning_rate": 0.00014166828825322694, "loss": 0.0118, "step": 97640 }, { "epoch": 1.06, "learning_rate": 0.00014165207238762403, "loss": 0.008, "step": 97650 }, { "epoch": 1.06, "learning_rate": 0.00014163585652202112, "loss": 0.0114, "step": 97660 }, { "epoch": 1.06, "learning_rate": 0.00014161964065641822, "loss": 0.0114, "step": 97670 }, { "epoch": 1.06, "learning_rate": 0.00014160342479081534, "loss": 0.0128, "step": 97680 }, { "epoch": 1.06, "learning_rate": 0.0001415872089252124, "loss": 0.0089, "step": 97690 }, { "epoch": 1.06, "learning_rate": 0.00014157099305960952, "loss": 0.0109, "step": 97700 }, { "epoch": 1.06, "learning_rate": 0.0001415547771940066, "loss": 0.0095, "step": 97710 }, { "epoch": 1.06, "learning_rate": 0.0001415385613284037, "loss": 0.0093, "step": 97720 }, { "epoch": 1.06, "learning_rate": 0.00014152234546280077, "loss": 0.012, "step": 97730 }, { "epoch": 1.06, "learning_rate": 0.0001415061295971979, "loss": 0.0119, "step": 97740 }, { "epoch": 1.06, "learning_rate": 0.00014148991373159499, "loss": 0.0105, "step": 97750 }, { "epoch": 1.06, "learning_rate": 0.00014147369786599208, "loss": 0.0091, "step": 97760 }, { "epoch": 1.06, "learning_rate": 0.00014145748200038917, "loss": 0.0078, "step": 97770 }, { "epoch": 1.06, "learning_rate": 0.00014144126613478626, "loss": 0.0089, "step": 97780 }, { "epoch": 1.06, "learning_rate": 0.00014142505026918336, "loss": 0.0113, "step": 97790 }, { "epoch": 1.06, "learning_rate": 0.00014140883440358045, "loss": 0.0105, "step": 97800 }, { "epoch": 1.06, "learning_rate": 0.00014139261853797754, "loss": 0.0106, "step": 97810 }, { "epoch": 1.06, "learning_rate": 0.00014137640267237463, "loss": 0.0104, "step": 97820 }, { "epoch": 1.06, "learning_rate": 0.00014136018680677175, "loss": 0.0096, "step": 97830 }, { "epoch": 1.06, "learning_rate": 0.00014134397094116882, "loss": 0.0104, "step": 97840 }, { "epoch": 1.06, "learning_rate": 0.00014132775507556594, "loss": 0.01, "step": 97850 }, { "epoch": 1.06, "learning_rate": 0.000141311539209963, "loss": 0.0101, "step": 97860 }, { "epoch": 1.06, "learning_rate": 0.00014129532334436013, "loss": 0.0112, "step": 97870 }, { "epoch": 1.06, "learning_rate": 0.0001412791074787572, "loss": 0.0103, "step": 97880 }, { "epoch": 1.06, "learning_rate": 0.0001412628916131543, "loss": 0.0114, "step": 97890 }, { "epoch": 1.06, "learning_rate": 0.0001412466757475514, "loss": 0.0124, "step": 97900 }, { "epoch": 1.06, "learning_rate": 0.0001412304598819485, "loss": 0.0074, "step": 97910 }, { "epoch": 1.06, "learning_rate": 0.0001412142440163456, "loss": 0.0093, "step": 97920 }, { "epoch": 1.06, "learning_rate": 0.00014119802815074268, "loss": 0.0096, "step": 97930 }, { "epoch": 1.06, "learning_rate": 0.00014118181228513977, "loss": 0.0101, "step": 97940 }, { "epoch": 1.06, "learning_rate": 0.00014116559641953687, "loss": 0.0117, "step": 97950 }, { "epoch": 1.06, "learning_rate": 0.00014114938055393396, "loss": 0.011, "step": 97960 }, { "epoch": 1.06, "learning_rate": 0.00014113316468833105, "loss": 0.0117, "step": 97970 }, { "epoch": 1.06, "learning_rate": 0.00014111694882272815, "loss": 0.0098, "step": 97980 }, { "epoch": 1.06, "learning_rate": 0.00014110073295712524, "loss": 0.0099, "step": 97990 }, { "epoch": 1.06, "learning_rate": 0.00014108451709152233, "loss": 0.0102, "step": 98000 }, { "epoch": 1.06, "eval_cer": 0.9215616786273294, "eval_loss": 0.008956007659435272, "eval_runtime": 121.1479, "eval_samples_per_second": 16.509, "eval_steps_per_second": 4.127, "step": 98000 }, { "epoch": 1.06, "learning_rate": 0.00014106830122591942, "loss": 0.0108, "step": 98010 }, { "epoch": 1.06, "learning_rate": 0.00014105208536031652, "loss": 0.0076, "step": 98020 }, { "epoch": 1.06, "learning_rate": 0.0001410358694947136, "loss": 0.0092, "step": 98030 }, { "epoch": 1.06, "learning_rate": 0.0001410196536291107, "loss": 0.0089, "step": 98040 }, { "epoch": 1.06, "learning_rate": 0.00014100343776350782, "loss": 0.0126, "step": 98050 }, { "epoch": 1.06, "learning_rate": 0.0001409872218979049, "loss": 0.0102, "step": 98060 }, { "epoch": 1.06, "learning_rate": 0.000140971006032302, "loss": 0.0111, "step": 98070 }, { "epoch": 1.06, "learning_rate": 0.00014095479016669907, "loss": 0.0099, "step": 98080 }, { "epoch": 1.06, "learning_rate": 0.0001409385743010962, "loss": 0.0105, "step": 98090 }, { "epoch": 1.06, "learning_rate": 0.00014092235843549326, "loss": 0.009, "step": 98100 }, { "epoch": 1.06, "learning_rate": 0.00014090614256989038, "loss": 0.0098, "step": 98110 }, { "epoch": 1.06, "learning_rate": 0.00014088992670428747, "loss": 0.0098, "step": 98120 }, { "epoch": 1.06, "learning_rate": 0.00014087371083868456, "loss": 0.0115, "step": 98130 }, { "epoch": 1.06, "learning_rate": 0.00014085749497308166, "loss": 0.0105, "step": 98140 }, { "epoch": 1.06, "learning_rate": 0.00014084127910747875, "loss": 0.0082, "step": 98150 }, { "epoch": 1.06, "learning_rate": 0.00014082506324187584, "loss": 0.0133, "step": 98160 }, { "epoch": 1.06, "learning_rate": 0.00014080884737627293, "loss": 0.0093, "step": 98170 }, { "epoch": 1.06, "learning_rate": 0.00014079263151067003, "loss": 0.0114, "step": 98180 }, { "epoch": 1.06, "learning_rate": 0.00014077641564506712, "loss": 0.0087, "step": 98190 }, { "epoch": 1.06, "learning_rate": 0.0001407601997794642, "loss": 0.0125, "step": 98200 }, { "epoch": 1.06, "learning_rate": 0.0001407439839138613, "loss": 0.0127, "step": 98210 }, { "epoch": 1.06, "learning_rate": 0.0001407277680482584, "loss": 0.0099, "step": 98220 }, { "epoch": 1.06, "learning_rate": 0.0001407115521826555, "loss": 0.0089, "step": 98230 }, { "epoch": 1.06, "learning_rate": 0.00014069533631705258, "loss": 0.0084, "step": 98240 }, { "epoch": 1.06, "learning_rate": 0.00014067912045144968, "loss": 0.0085, "step": 98250 }, { "epoch": 1.06, "learning_rate": 0.00014066290458584677, "loss": 0.0092, "step": 98260 }, { "epoch": 1.06, "learning_rate": 0.0001406466887202439, "loss": 0.0099, "step": 98270 }, { "epoch": 1.06, "learning_rate": 0.00014063047285464095, "loss": 0.0118, "step": 98280 }, { "epoch": 1.06, "learning_rate": 0.00014061425698903807, "loss": 0.0086, "step": 98290 }, { "epoch": 1.06, "learning_rate": 0.00014059804112343514, "loss": 0.0093, "step": 98300 }, { "epoch": 1.06, "learning_rate": 0.00014058182525783226, "loss": 0.0105, "step": 98310 }, { "epoch": 1.06, "learning_rate": 0.00014056560939222933, "loss": 0.0107, "step": 98320 }, { "epoch": 1.06, "learning_rate": 0.00014054939352662645, "loss": 0.0107, "step": 98330 }, { "epoch": 1.06, "learning_rate": 0.00014053317766102354, "loss": 0.0112, "step": 98340 }, { "epoch": 1.06, "learning_rate": 0.00014051696179542063, "loss": 0.0148, "step": 98350 }, { "epoch": 1.06, "learning_rate": 0.00014050074592981772, "loss": 0.0129, "step": 98360 }, { "epoch": 1.06, "learning_rate": 0.00014048453006421482, "loss": 0.0123, "step": 98370 }, { "epoch": 1.06, "learning_rate": 0.0001404683141986119, "loss": 0.0108, "step": 98380 }, { "epoch": 1.06, "learning_rate": 0.000140452098333009, "loss": 0.0129, "step": 98390 }, { "epoch": 1.06, "learning_rate": 0.0001404358824674061, "loss": 0.0128, "step": 98400 }, { "epoch": 1.06, "learning_rate": 0.0001404196666018032, "loss": 0.0096, "step": 98410 }, { "epoch": 1.06, "learning_rate": 0.00014040345073620028, "loss": 0.0147, "step": 98420 }, { "epoch": 1.06, "learning_rate": 0.00014038723487059737, "loss": 0.0108, "step": 98430 }, { "epoch": 1.06, "learning_rate": 0.00014037101900499447, "loss": 0.0148, "step": 98440 }, { "epoch": 1.06, "learning_rate": 0.00014035480313939156, "loss": 0.014, "step": 98450 }, { "epoch": 1.06, "learning_rate": 0.00014033858727378865, "loss": 0.0088, "step": 98460 }, { "epoch": 1.06, "learning_rate": 0.00014032237140818577, "loss": 0.0099, "step": 98470 }, { "epoch": 1.06, "learning_rate": 0.00014030615554258284, "loss": 0.0095, "step": 98480 }, { "epoch": 1.06, "learning_rate": 0.00014028993967697996, "loss": 0.0109, "step": 98490 }, { "epoch": 1.06, "learning_rate": 0.00014027372381137702, "loss": 0.0112, "step": 98500 }, { "epoch": 1.06, "learning_rate": 0.00014025750794577414, "loss": 0.009, "step": 98510 }, { "epoch": 1.07, "learning_rate": 0.0001402412920801712, "loss": 0.0086, "step": 98520 }, { "epoch": 1.07, "learning_rate": 0.00014022507621456833, "loss": 0.0107, "step": 98530 }, { "epoch": 1.07, "learning_rate": 0.00014020886034896542, "loss": 0.01, "step": 98540 }, { "epoch": 1.07, "learning_rate": 0.0001401926444833625, "loss": 0.0132, "step": 98550 }, { "epoch": 1.07, "learning_rate": 0.0001401764286177596, "loss": 0.01, "step": 98560 }, { "epoch": 1.07, "learning_rate": 0.0001401602127521567, "loss": 0.0093, "step": 98570 }, { "epoch": 1.07, "learning_rate": 0.0001401439968865538, "loss": 0.0112, "step": 98580 }, { "epoch": 1.07, "learning_rate": 0.00014012778102095088, "loss": 0.0103, "step": 98590 }, { "epoch": 1.07, "learning_rate": 0.00014011156515534798, "loss": 0.013, "step": 98600 }, { "epoch": 1.07, "learning_rate": 0.00014009534928974507, "loss": 0.0132, "step": 98610 }, { "epoch": 1.07, "learning_rate": 0.0001400791334241422, "loss": 0.0089, "step": 98620 }, { "epoch": 1.07, "learning_rate": 0.00014006291755853925, "loss": 0.0108, "step": 98630 }, { "epoch": 1.07, "learning_rate": 0.00014004670169293637, "loss": 0.0114, "step": 98640 }, { "epoch": 1.07, "learning_rate": 0.00014003048582733344, "loss": 0.0108, "step": 98650 }, { "epoch": 1.07, "learning_rate": 0.00014001426996173056, "loss": 0.0095, "step": 98660 }, { "epoch": 1.07, "learning_rate": 0.00013999805409612763, "loss": 0.0105, "step": 98670 }, { "epoch": 1.07, "learning_rate": 0.00013998183823052475, "loss": 0.0126, "step": 98680 }, { "epoch": 1.07, "learning_rate": 0.00013996562236492184, "loss": 0.0108, "step": 98690 }, { "epoch": 1.07, "learning_rate": 0.00013994940649931893, "loss": 0.0118, "step": 98700 }, { "epoch": 1.07, "learning_rate": 0.00013993319063371602, "loss": 0.0117, "step": 98710 }, { "epoch": 1.07, "learning_rate": 0.00013991697476811312, "loss": 0.0105, "step": 98720 }, { "epoch": 1.07, "learning_rate": 0.0001399007589025102, "loss": 0.0137, "step": 98730 }, { "epoch": 1.07, "learning_rate": 0.0001398845430369073, "loss": 0.0122, "step": 98740 }, { "epoch": 1.07, "learning_rate": 0.0001398683271713044, "loss": 0.0094, "step": 98750 }, { "epoch": 1.07, "learning_rate": 0.0001398521113057015, "loss": 0.0125, "step": 98760 }, { "epoch": 1.07, "learning_rate": 0.00013983589544009858, "loss": 0.0109, "step": 98770 }, { "epoch": 1.07, "learning_rate": 0.00013981967957449567, "loss": 0.0112, "step": 98780 }, { "epoch": 1.07, "learning_rate": 0.00013980346370889277, "loss": 0.0107, "step": 98790 }, { "epoch": 1.07, "learning_rate": 0.00013978724784328986, "loss": 0.0104, "step": 98800 }, { "epoch": 1.07, "learning_rate": 0.00013977103197768695, "loss": 0.0126, "step": 98810 }, { "epoch": 1.07, "learning_rate": 0.00013975481611208404, "loss": 0.0097, "step": 98820 }, { "epoch": 1.07, "learning_rate": 0.00013973860024648114, "loss": 0.0115, "step": 98830 }, { "epoch": 1.07, "learning_rate": 0.00013972238438087826, "loss": 0.01, "step": 98840 }, { "epoch": 1.07, "learning_rate": 0.00013970616851527532, "loss": 0.0119, "step": 98850 }, { "epoch": 1.07, "learning_rate": 0.00013968995264967244, "loss": 0.0095, "step": 98860 }, { "epoch": 1.07, "learning_rate": 0.0001396737367840695, "loss": 0.0097, "step": 98870 }, { "epoch": 1.07, "learning_rate": 0.00013965752091846663, "loss": 0.0098, "step": 98880 }, { "epoch": 1.07, "learning_rate": 0.0001396413050528637, "loss": 0.0114, "step": 98890 }, { "epoch": 1.07, "learning_rate": 0.0001396250891872608, "loss": 0.0101, "step": 98900 }, { "epoch": 1.07, "learning_rate": 0.0001396088733216579, "loss": 0.0111, "step": 98910 }, { "epoch": 1.07, "learning_rate": 0.000139592657456055, "loss": 0.0102, "step": 98920 }, { "epoch": 1.07, "learning_rate": 0.0001395764415904521, "loss": 0.0106, "step": 98930 }, { "epoch": 1.07, "learning_rate": 0.00013956022572484918, "loss": 0.0116, "step": 98940 }, { "epoch": 1.07, "learning_rate": 0.00013954400985924628, "loss": 0.0136, "step": 98950 }, { "epoch": 1.07, "learning_rate": 0.00013952779399364337, "loss": 0.0102, "step": 98960 }, { "epoch": 1.07, "learning_rate": 0.00013951157812804046, "loss": 0.0142, "step": 98970 }, { "epoch": 1.07, "learning_rate": 0.00013949536226243756, "loss": 0.0094, "step": 98980 }, { "epoch": 1.07, "learning_rate": 0.00013947914639683465, "loss": 0.0102, "step": 98990 }, { "epoch": 1.07, "learning_rate": 0.00013946293053123174, "loss": 0.0109, "step": 99000 }, { "epoch": 1.07, "eval_cer": 0.9215460437741146, "eval_loss": 0.008673109114170074, "eval_runtime": 121.2918, "eval_samples_per_second": 16.489, "eval_steps_per_second": 4.122, "step": 99000 }, { "epoch": 1.07, "learning_rate": 0.00013944671466562883, "loss": 0.0079, "step": 99010 }, { "epoch": 1.07, "learning_rate": 0.00013943049880002593, "loss": 0.009, "step": 99020 }, { "epoch": 1.07, "learning_rate": 0.00013941428293442302, "loss": 0.0111, "step": 99030 }, { "epoch": 1.07, "learning_rate": 0.0001393980670688201, "loss": 0.0092, "step": 99040 }, { "epoch": 1.07, "learning_rate": 0.0001393818512032172, "loss": 0.0087, "step": 99050 }, { "epoch": 1.07, "learning_rate": 0.00013936563533761432, "loss": 0.0103, "step": 99060 }, { "epoch": 1.07, "learning_rate": 0.0001393494194720114, "loss": 0.0107, "step": 99070 }, { "epoch": 1.07, "learning_rate": 0.0001393332036064085, "loss": 0.0113, "step": 99080 }, { "epoch": 1.07, "learning_rate": 0.00013931698774080558, "loss": 0.008, "step": 99090 }, { "epoch": 1.07, "learning_rate": 0.0001393007718752027, "loss": 0.0114, "step": 99100 }, { "epoch": 1.07, "learning_rate": 0.00013928455600959976, "loss": 0.0119, "step": 99110 }, { "epoch": 1.07, "learning_rate": 0.00013926834014399688, "loss": 0.0135, "step": 99120 }, { "epoch": 1.07, "learning_rate": 0.00013925212427839397, "loss": 0.0117, "step": 99130 }, { "epoch": 1.07, "learning_rate": 0.00013923590841279107, "loss": 0.0127, "step": 99140 }, { "epoch": 1.07, "learning_rate": 0.00013921969254718816, "loss": 0.011, "step": 99150 }, { "epoch": 1.07, "learning_rate": 0.00013920347668158525, "loss": 0.0103, "step": 99160 }, { "epoch": 1.07, "learning_rate": 0.00013918726081598234, "loss": 0.0095, "step": 99170 }, { "epoch": 1.07, "learning_rate": 0.00013917104495037944, "loss": 0.0093, "step": 99180 }, { "epoch": 1.07, "learning_rate": 0.00013915482908477653, "loss": 0.011, "step": 99190 }, { "epoch": 1.07, "learning_rate": 0.00013913861321917362, "loss": 0.0133, "step": 99200 }, { "epoch": 1.07, "learning_rate": 0.00013912239735357072, "loss": 0.0104, "step": 99210 }, { "epoch": 1.07, "learning_rate": 0.0001391061814879678, "loss": 0.0104, "step": 99220 }, { "epoch": 1.07, "learning_rate": 0.0001390899656223649, "loss": 0.0099, "step": 99230 }, { "epoch": 1.07, "learning_rate": 0.000139073749756762, "loss": 0.01, "step": 99240 }, { "epoch": 1.07, "learning_rate": 0.00013905753389115909, "loss": 0.0133, "step": 99250 }, { "epoch": 1.07, "learning_rate": 0.00013904131802555618, "loss": 0.0084, "step": 99260 }, { "epoch": 1.07, "learning_rate": 0.0001390251021599533, "loss": 0.0105, "step": 99270 }, { "epoch": 1.07, "learning_rate": 0.0001390088862943504, "loss": 0.011, "step": 99280 }, { "epoch": 1.07, "learning_rate": 0.00013899267042874748, "loss": 0.0096, "step": 99290 }, { "epoch": 1.07, "learning_rate": 0.00013897645456314458, "loss": 0.0092, "step": 99300 }, { "epoch": 1.07, "learning_rate": 0.00013896023869754167, "loss": 0.0125, "step": 99310 }, { "epoch": 1.07, "learning_rate": 0.00013894402283193876, "loss": 0.011, "step": 99320 }, { "epoch": 1.07, "learning_rate": 0.00013892780696633586, "loss": 0.01, "step": 99330 }, { "epoch": 1.07, "learning_rate": 0.00013891159110073295, "loss": 0.0117, "step": 99340 }, { "epoch": 1.07, "learning_rate": 0.00013889537523513004, "loss": 0.0097, "step": 99350 }, { "epoch": 1.07, "learning_rate": 0.00013887915936952713, "loss": 0.0105, "step": 99360 }, { "epoch": 1.07, "learning_rate": 0.00013886294350392423, "loss": 0.0098, "step": 99370 }, { "epoch": 1.07, "learning_rate": 0.00013884672763832132, "loss": 0.0157, "step": 99380 }, { "epoch": 1.07, "learning_rate": 0.0001388305117727184, "loss": 0.0094, "step": 99390 }, { "epoch": 1.07, "learning_rate": 0.0001388142959071155, "loss": 0.0111, "step": 99400 }, { "epoch": 1.07, "learning_rate": 0.0001387980800415126, "loss": 0.0108, "step": 99410 }, { "epoch": 1.07, "learning_rate": 0.0001387818641759097, "loss": 0.0133, "step": 99420 }, { "epoch": 1.07, "learning_rate": 0.0001387656483103068, "loss": 0.0093, "step": 99430 }, { "epoch": 1.07, "learning_rate": 0.00013874943244470388, "loss": 0.0166, "step": 99440 }, { "epoch": 1.08, "learning_rate": 0.000138733216579101, "loss": 0.0092, "step": 99450 }, { "epoch": 1.08, "learning_rate": 0.00013871700071349806, "loss": 0.0116, "step": 99460 }, { "epoch": 1.08, "learning_rate": 0.00013870078484789518, "loss": 0.0127, "step": 99470 }, { "epoch": 1.08, "learning_rate": 0.00013868456898229227, "loss": 0.0105, "step": 99480 }, { "epoch": 1.08, "learning_rate": 0.00013866835311668937, "loss": 0.0121, "step": 99490 }, { "epoch": 1.08, "learning_rate": 0.00013865213725108646, "loss": 0.0101, "step": 99500 }, { "epoch": 1.08, "learning_rate": 0.00013863592138548355, "loss": 0.0102, "step": 99510 }, { "epoch": 1.08, "learning_rate": 0.00013861970551988064, "loss": 0.0097, "step": 99520 }, { "epoch": 1.08, "learning_rate": 0.00013860348965427774, "loss": 0.0112, "step": 99530 }, { "epoch": 1.08, "learning_rate": 0.00013858727378867483, "loss": 0.0111, "step": 99540 }, { "epoch": 1.08, "learning_rate": 0.00013857105792307192, "loss": 0.0106, "step": 99550 }, { "epoch": 1.08, "learning_rate": 0.00013855484205746902, "loss": 0.0127, "step": 99560 }, { "epoch": 1.08, "learning_rate": 0.0001385386261918661, "loss": 0.0123, "step": 99570 }, { "epoch": 1.08, "learning_rate": 0.0001385224103262632, "loss": 0.0096, "step": 99580 }, { "epoch": 1.08, "learning_rate": 0.0001385061944606603, "loss": 0.0115, "step": 99590 }, { "epoch": 1.08, "learning_rate": 0.0001384899785950574, "loss": 0.0105, "step": 99600 }, { "epoch": 1.08, "learning_rate": 0.00013847376272945448, "loss": 0.0126, "step": 99610 }, { "epoch": 1.08, "learning_rate": 0.00013845754686385157, "loss": 0.0105, "step": 99620 }, { "epoch": 1.08, "learning_rate": 0.0001384413309982487, "loss": 0.007, "step": 99630 }, { "epoch": 1.08, "learning_rate": 0.00013842511513264576, "loss": 0.0092, "step": 99640 }, { "epoch": 1.08, "learning_rate": 0.00013840889926704288, "loss": 0.0087, "step": 99650 }, { "epoch": 1.08, "learning_rate": 0.00013839268340143994, "loss": 0.0115, "step": 99660 }, { "epoch": 1.08, "learning_rate": 0.00013837646753583706, "loss": 0.0097, "step": 99670 }, { "epoch": 1.08, "learning_rate": 0.00013836025167023413, "loss": 0.0125, "step": 99680 }, { "epoch": 1.08, "learning_rate": 0.00013834403580463125, "loss": 0.01, "step": 99690 }, { "epoch": 1.08, "learning_rate": 0.00013832781993902834, "loss": 0.0123, "step": 99700 }, { "epoch": 1.08, "learning_rate": 0.00013831160407342543, "loss": 0.0082, "step": 99710 }, { "epoch": 1.08, "learning_rate": 0.00013829538820782253, "loss": 0.0116, "step": 99720 }, { "epoch": 1.08, "learning_rate": 0.00013827917234221962, "loss": 0.0122, "step": 99730 }, { "epoch": 1.08, "learning_rate": 0.0001382629564766167, "loss": 0.0109, "step": 99740 }, { "epoch": 1.08, "learning_rate": 0.0001382467406110138, "loss": 0.0103, "step": 99750 }, { "epoch": 1.08, "learning_rate": 0.0001382305247454109, "loss": 0.0089, "step": 99760 }, { "epoch": 1.08, "learning_rate": 0.000138214308879808, "loss": 0.011, "step": 99770 }, { "epoch": 1.08, "learning_rate": 0.00013819809301420508, "loss": 0.0103, "step": 99780 }, { "epoch": 1.08, "learning_rate": 0.00013818187714860218, "loss": 0.0082, "step": 99790 }, { "epoch": 1.08, "learning_rate": 0.00013816566128299927, "loss": 0.0121, "step": 99800 }, { "epoch": 1.08, "learning_rate": 0.00013814944541739636, "loss": 0.0103, "step": 99810 }, { "epoch": 1.08, "learning_rate": 0.00013813322955179345, "loss": 0.013, "step": 99820 }, { "epoch": 1.08, "learning_rate": 0.00013811701368619055, "loss": 0.0107, "step": 99830 }, { "epoch": 1.08, "learning_rate": 0.00013810079782058764, "loss": 0.0094, "step": 99840 }, { "epoch": 1.08, "learning_rate": 0.00013808458195498476, "loss": 0.0108, "step": 99850 }, { "epoch": 1.08, "learning_rate": 0.00013806836608938182, "loss": 0.0105, "step": 99860 }, { "epoch": 1.08, "learning_rate": 0.00013805215022377894, "loss": 0.0115, "step": 99870 }, { "epoch": 1.08, "learning_rate": 0.000138035934358176, "loss": 0.0104, "step": 99880 }, { "epoch": 1.08, "learning_rate": 0.00013801971849257313, "loss": 0.0112, "step": 99890 }, { "epoch": 1.08, "learning_rate": 0.0001380035026269702, "loss": 0.0103, "step": 99900 }, { "epoch": 1.08, "learning_rate": 0.00013798728676136732, "loss": 0.0105, "step": 99910 }, { "epoch": 1.08, "learning_rate": 0.0001379710708957644, "loss": 0.0153, "step": 99920 }, { "epoch": 1.08, "learning_rate": 0.0001379548550301615, "loss": 0.0086, "step": 99930 }, { "epoch": 1.08, "learning_rate": 0.0001379386391645586, "loss": 0.011, "step": 99940 }, { "epoch": 1.08, "learning_rate": 0.0001379224232989557, "loss": 0.0124, "step": 99950 }, { "epoch": 1.08, "learning_rate": 0.00013790620743335278, "loss": 0.011, "step": 99960 }, { "epoch": 1.08, "learning_rate": 0.00013788999156774987, "loss": 0.0117, "step": 99970 }, { "epoch": 1.08, "learning_rate": 0.00013787377570214696, "loss": 0.013, "step": 99980 }, { "epoch": 1.08, "learning_rate": 0.00013785755983654406, "loss": 0.0116, "step": 99990 }, { "epoch": 1.08, "learning_rate": 0.00013784134397094118, "loss": 0.0094, "step": 100000 }, { "epoch": 1.08, "eval_cer": 0.921535620538638, "eval_loss": 0.008387841284275055, "eval_runtime": 121.0639, "eval_samples_per_second": 16.52, "eval_steps_per_second": 4.13, "step": 100000 }, { "epoch": 1.08, "learning_rate": 0.00013782512810533824, "loss": 0.0094, "step": 100010 }, { "epoch": 1.08, "learning_rate": 0.00013780891223973536, "loss": 0.0095, "step": 100020 }, { "epoch": 1.08, "learning_rate": 0.00013779269637413243, "loss": 0.0102, "step": 100030 }, { "epoch": 1.08, "learning_rate": 0.00013777648050852955, "loss": 0.0137, "step": 100040 }, { "epoch": 1.08, "learning_rate": 0.00013776026464292661, "loss": 0.0112, "step": 100050 }, { "epoch": 1.08, "learning_rate": 0.00013774404877732373, "loss": 0.0116, "step": 100060 }, { "epoch": 1.08, "learning_rate": 0.00013772783291172083, "loss": 0.0104, "step": 100070 }, { "epoch": 1.08, "learning_rate": 0.00013771161704611792, "loss": 0.0114, "step": 100080 }, { "epoch": 1.08, "learning_rate": 0.000137695401180515, "loss": 0.0093, "step": 100090 }, { "epoch": 1.08, "learning_rate": 0.0001376791853149121, "loss": 0.0115, "step": 100100 }, { "epoch": 1.08, "learning_rate": 0.0001376629694493092, "loss": 0.0119, "step": 100110 }, { "epoch": 1.08, "learning_rate": 0.0001376467535837063, "loss": 0.0115, "step": 100120 }, { "epoch": 1.08, "learning_rate": 0.00013763053771810338, "loss": 0.0086, "step": 100130 }, { "epoch": 1.08, "learning_rate": 0.00013761432185250048, "loss": 0.009, "step": 100140 }, { "epoch": 1.08, "learning_rate": 0.00013759810598689757, "loss": 0.0107, "step": 100150 }, { "epoch": 1.08, "learning_rate": 0.00013758189012129466, "loss": 0.0124, "step": 100160 }, { "epoch": 1.08, "learning_rate": 0.00013756567425569175, "loss": 0.0091, "step": 100170 }, { "epoch": 1.08, "learning_rate": 0.00013754945839008885, "loss": 0.0082, "step": 100180 }, { "epoch": 1.08, "learning_rate": 0.00013753324252448594, "loss": 0.0096, "step": 100190 }, { "epoch": 1.08, "learning_rate": 0.00013751702665888303, "loss": 0.0104, "step": 100200 }, { "epoch": 1.08, "learning_rate": 0.00013750081079328013, "loss": 0.0097, "step": 100210 }, { "epoch": 1.08, "learning_rate": 0.00013748459492767725, "loss": 0.0119, "step": 100220 }, { "epoch": 1.08, "learning_rate": 0.0001374683790620743, "loss": 0.0091, "step": 100230 }, { "epoch": 1.08, "learning_rate": 0.00013745216319647143, "loss": 0.0128, "step": 100240 }, { "epoch": 1.08, "learning_rate": 0.0001374359473308685, "loss": 0.0096, "step": 100250 }, { "epoch": 1.08, "learning_rate": 0.00013741973146526562, "loss": 0.012, "step": 100260 }, { "epoch": 1.08, "learning_rate": 0.00013740351559966268, "loss": 0.0116, "step": 100270 }, { "epoch": 1.08, "learning_rate": 0.0001373872997340598, "loss": 0.011, "step": 100280 }, { "epoch": 1.08, "learning_rate": 0.0001373710838684569, "loss": 0.0132, "step": 100290 }, { "epoch": 1.08, "learning_rate": 0.000137354868002854, "loss": 0.0112, "step": 100300 }, { "epoch": 1.08, "learning_rate": 0.00013733865213725108, "loss": 0.0101, "step": 100310 }, { "epoch": 1.08, "learning_rate": 0.00013732243627164817, "loss": 0.0119, "step": 100320 }, { "epoch": 1.08, "learning_rate": 0.00013730622040604527, "loss": 0.0083, "step": 100330 }, { "epoch": 1.08, "learning_rate": 0.00013729000454044236, "loss": 0.0113, "step": 100340 }, { "epoch": 1.08, "learning_rate": 0.00013727378867483945, "loss": 0.0116, "step": 100350 }, { "epoch": 1.08, "learning_rate": 0.00013725757280923654, "loss": 0.0088, "step": 100360 }, { "epoch": 1.09, "learning_rate": 0.00013724135694363364, "loss": 0.0106, "step": 100370 }, { "epoch": 1.09, "learning_rate": 0.00013722514107803073, "loss": 0.0095, "step": 100380 }, { "epoch": 1.09, "learning_rate": 0.00013720892521242782, "loss": 0.0089, "step": 100390 }, { "epoch": 1.09, "learning_rate": 0.00013719270934682491, "loss": 0.0087, "step": 100400 }, { "epoch": 1.09, "learning_rate": 0.000137176493481222, "loss": 0.0118, "step": 100410 }, { "epoch": 1.09, "learning_rate": 0.0001371602776156191, "loss": 0.0121, "step": 100420 }, { "epoch": 1.09, "learning_rate": 0.0001371440617500162, "loss": 0.008, "step": 100430 }, { "epoch": 1.09, "learning_rate": 0.0001371278458844133, "loss": 0.0086, "step": 100440 }, { "epoch": 1.09, "learning_rate": 0.00013711163001881038, "loss": 0.0126, "step": 100450 }, { "epoch": 1.09, "learning_rate": 0.0001370954141532075, "loss": 0.0112, "step": 100460 }, { "epoch": 1.09, "learning_rate": 0.00013707919828760456, "loss": 0.0103, "step": 100470 }, { "epoch": 1.09, "learning_rate": 0.00013706298242200168, "loss": 0.0093, "step": 100480 }, { "epoch": 1.09, "learning_rate": 0.00013704676655639878, "loss": 0.0108, "step": 100490 }, { "epoch": 1.09, "learning_rate": 0.00013703055069079587, "loss": 0.0093, "step": 100500 }, { "epoch": 1.09, "learning_rate": 0.00013701433482519296, "loss": 0.011, "step": 100510 }, { "epoch": 1.09, "learning_rate": 0.00013699811895959005, "loss": 0.0104, "step": 100520 }, { "epoch": 1.09, "learning_rate": 0.00013698190309398715, "loss": 0.0089, "step": 100530 }, { "epoch": 1.09, "learning_rate": 0.00013696568722838424, "loss": 0.0093, "step": 100540 }, { "epoch": 1.09, "learning_rate": 0.00013694947136278133, "loss": 0.0089, "step": 100550 }, { "epoch": 1.09, "learning_rate": 0.00013693325549717843, "loss": 0.0116, "step": 100560 }, { "epoch": 1.09, "learning_rate": 0.00013691703963157552, "loss": 0.0106, "step": 100570 }, { "epoch": 1.09, "learning_rate": 0.0001369008237659726, "loss": 0.0094, "step": 100580 }, { "epoch": 1.09, "learning_rate": 0.0001368846079003697, "loss": 0.0128, "step": 100590 }, { "epoch": 1.09, "learning_rate": 0.0001368683920347668, "loss": 0.0099, "step": 100600 }, { "epoch": 1.09, "learning_rate": 0.0001368521761691639, "loss": 0.0082, "step": 100610 }, { "epoch": 1.09, "learning_rate": 0.00013683596030356098, "loss": 0.0111, "step": 100620 }, { "epoch": 1.09, "learning_rate": 0.00013681974443795807, "loss": 0.0095, "step": 100630 }, { "epoch": 1.09, "learning_rate": 0.0001368035285723552, "loss": 0.0102, "step": 100640 }, { "epoch": 1.09, "learning_rate": 0.00013678731270675226, "loss": 0.0126, "step": 100650 }, { "epoch": 1.09, "learning_rate": 0.00013677109684114938, "loss": 0.0084, "step": 100660 }, { "epoch": 1.09, "learning_rate": 0.00013675488097554645, "loss": 0.0099, "step": 100670 }, { "epoch": 1.09, "learning_rate": 0.00013673866510994357, "loss": 0.0137, "step": 100680 }, { "epoch": 1.09, "learning_rate": 0.00013672244924434063, "loss": 0.0109, "step": 100690 }, { "epoch": 1.09, "learning_rate": 0.00013670623337873775, "loss": 0.0113, "step": 100700 }, { "epoch": 1.09, "learning_rate": 0.00013669001751313484, "loss": 0.0115, "step": 100710 }, { "epoch": 1.09, "learning_rate": 0.00013667380164753194, "loss": 0.0113, "step": 100720 }, { "epoch": 1.09, "learning_rate": 0.00013665758578192903, "loss": 0.0101, "step": 100730 }, { "epoch": 1.09, "learning_rate": 0.00013664136991632612, "loss": 0.0078, "step": 100740 }, { "epoch": 1.09, "learning_rate": 0.00013662515405072321, "loss": 0.0124, "step": 100750 }, { "epoch": 1.09, "learning_rate": 0.0001366089381851203, "loss": 0.0094, "step": 100760 }, { "epoch": 1.09, "learning_rate": 0.0001365927223195174, "loss": 0.0087, "step": 100770 }, { "epoch": 1.09, "learning_rate": 0.0001365765064539145, "loss": 0.0114, "step": 100780 }, { "epoch": 1.09, "learning_rate": 0.0001365602905883116, "loss": 0.0113, "step": 100790 }, { "epoch": 1.09, "learning_rate": 0.00013654407472270868, "loss": 0.0094, "step": 100800 }, { "epoch": 1.09, "learning_rate": 0.0001365278588571058, "loss": 0.0099, "step": 100810 }, { "epoch": 1.09, "learning_rate": 0.00013651164299150286, "loss": 0.0123, "step": 100820 }, { "epoch": 1.09, "learning_rate": 0.00013649542712589998, "loss": 0.0088, "step": 100830 }, { "epoch": 1.09, "learning_rate": 0.00013647921126029705, "loss": 0.0127, "step": 100840 }, { "epoch": 1.09, "learning_rate": 0.00013646299539469417, "loss": 0.0088, "step": 100850 }, { "epoch": 1.09, "learning_rate": 0.00013644677952909126, "loss": 0.0083, "step": 100860 }, { "epoch": 1.09, "learning_rate": 0.00013643056366348835, "loss": 0.0104, "step": 100870 }, { "epoch": 1.09, "learning_rate": 0.00013641434779788545, "loss": 0.0095, "step": 100880 }, { "epoch": 1.09, "learning_rate": 0.00013639813193228254, "loss": 0.0152, "step": 100890 }, { "epoch": 1.09, "learning_rate": 0.00013638191606667963, "loss": 0.0117, "step": 100900 }, { "epoch": 1.09, "learning_rate": 0.00013636570020107673, "loss": 0.0109, "step": 100910 }, { "epoch": 1.09, "learning_rate": 0.00013634948433547382, "loss": 0.008, "step": 100920 }, { "epoch": 1.09, "learning_rate": 0.0001363332684698709, "loss": 0.0096, "step": 100930 }, { "epoch": 1.09, "learning_rate": 0.000136317052604268, "loss": 0.0095, "step": 100940 }, { "epoch": 1.09, "learning_rate": 0.0001363008367386651, "loss": 0.0108, "step": 100950 }, { "epoch": 1.09, "learning_rate": 0.0001362846208730622, "loss": 0.0107, "step": 100960 }, { "epoch": 1.09, "learning_rate": 0.00013626840500745928, "loss": 0.0097, "step": 100970 }, { "epoch": 1.09, "learning_rate": 0.00013625218914185637, "loss": 0.0115, "step": 100980 }, { "epoch": 1.09, "learning_rate": 0.00013623597327625347, "loss": 0.0148, "step": 100990 }, { "epoch": 1.09, "learning_rate": 0.00013621975741065056, "loss": 0.009, "step": 101000 }, { "epoch": 1.09, "eval_cer": 0.9215312775238562, "eval_loss": 0.008509015664458275, "eval_runtime": 121.1391, "eval_samples_per_second": 16.51, "eval_steps_per_second": 4.127, "step": 101000 }, { "epoch": 1.09, "learning_rate": 0.00013620354154504768, "loss": 0.0086, "step": 101010 }, { "epoch": 1.09, "learning_rate": 0.00013618732567944475, "loss": 0.0093, "step": 101020 }, { "epoch": 1.09, "learning_rate": 0.00013617110981384187, "loss": 0.0112, "step": 101030 }, { "epoch": 1.09, "learning_rate": 0.00013615489394823893, "loss": 0.0121, "step": 101040 }, { "epoch": 1.09, "learning_rate": 0.00013613867808263605, "loss": 0.0088, "step": 101050 }, { "epoch": 1.09, "learning_rate": 0.00013612246221703312, "loss": 0.0112, "step": 101060 }, { "epoch": 1.09, "learning_rate": 0.00013610624635143024, "loss": 0.0131, "step": 101070 }, { "epoch": 1.09, "learning_rate": 0.00013609003048582733, "loss": 0.0091, "step": 101080 }, { "epoch": 1.09, "learning_rate": 0.00013607381462022442, "loss": 0.0113, "step": 101090 }, { "epoch": 1.09, "learning_rate": 0.00013605759875462151, "loss": 0.0106, "step": 101100 }, { "epoch": 1.09, "learning_rate": 0.0001360413828890186, "loss": 0.0116, "step": 101110 }, { "epoch": 1.09, "learning_rate": 0.0001360251670234157, "loss": 0.0081, "step": 101120 }, { "epoch": 1.09, "learning_rate": 0.0001360089511578128, "loss": 0.0099, "step": 101130 }, { "epoch": 1.09, "learning_rate": 0.00013599273529220989, "loss": 0.0096, "step": 101140 }, { "epoch": 1.09, "learning_rate": 0.00013597651942660698, "loss": 0.0122, "step": 101150 }, { "epoch": 1.09, "learning_rate": 0.00013596030356100407, "loss": 0.0106, "step": 101160 }, { "epoch": 1.09, "learning_rate": 0.00013594408769540116, "loss": 0.0114, "step": 101170 }, { "epoch": 1.09, "learning_rate": 0.00013592787182979826, "loss": 0.0113, "step": 101180 }, { "epoch": 1.09, "learning_rate": 0.00013591165596419535, "loss": 0.0125, "step": 101190 }, { "epoch": 1.09, "learning_rate": 0.00013589544009859244, "loss": 0.0115, "step": 101200 }, { "epoch": 1.09, "learning_rate": 0.00013587922423298954, "loss": 0.0084, "step": 101210 }, { "epoch": 1.09, "learning_rate": 0.00013586300836738663, "loss": 0.0099, "step": 101220 }, { "epoch": 1.09, "learning_rate": 0.00013584679250178375, "loss": 0.0146, "step": 101230 }, { "epoch": 1.09, "learning_rate": 0.0001358305766361808, "loss": 0.01, "step": 101240 }, { "epoch": 1.09, "learning_rate": 0.00013581436077057793, "loss": 0.0111, "step": 101250 }, { "epoch": 1.09, "learning_rate": 0.000135798144904975, "loss": 0.0125, "step": 101260 }, { "epoch": 1.09, "learning_rate": 0.00013578192903937212, "loss": 0.0107, "step": 101270 }, { "epoch": 1.09, "learning_rate": 0.00013576571317376918, "loss": 0.0079, "step": 101280 }, { "epoch": 1.09, "learning_rate": 0.0001357494973081663, "loss": 0.012, "step": 101290 }, { "epoch": 1.1, "learning_rate": 0.0001357332814425634, "loss": 0.0094, "step": 101300 }, { "epoch": 1.1, "learning_rate": 0.0001357170655769605, "loss": 0.0096, "step": 101310 }, { "epoch": 1.1, "learning_rate": 0.00013570084971135758, "loss": 0.0111, "step": 101320 }, { "epoch": 1.1, "learning_rate": 0.00013568463384575468, "loss": 0.0115, "step": 101330 }, { "epoch": 1.1, "learning_rate": 0.00013566841798015177, "loss": 0.0104, "step": 101340 }, { "epoch": 1.1, "learning_rate": 0.00013565220211454886, "loss": 0.0109, "step": 101350 }, { "epoch": 1.1, "learning_rate": 0.00013563598624894595, "loss": 0.0134, "step": 101360 }, { "epoch": 1.1, "learning_rate": 0.00013561977038334305, "loss": 0.0116, "step": 101370 }, { "epoch": 1.1, "learning_rate": 0.00013560355451774014, "loss": 0.0107, "step": 101380 }, { "epoch": 1.1, "learning_rate": 0.00013558733865213723, "loss": 0.0084, "step": 101390 }, { "epoch": 1.1, "learning_rate": 0.00013557112278653432, "loss": 0.0118, "step": 101400 }, { "epoch": 1.1, "learning_rate": 0.00013555490692093142, "loss": 0.0111, "step": 101410 }, { "epoch": 1.1, "learning_rate": 0.0001355386910553285, "loss": 0.0094, "step": 101420 }, { "epoch": 1.1, "learning_rate": 0.0001355224751897256, "loss": 0.0105, "step": 101430 }, { "epoch": 1.1, "learning_rate": 0.00013550625932412272, "loss": 0.0118, "step": 101440 }, { "epoch": 1.1, "learning_rate": 0.00013549004345851982, "loss": 0.0114, "step": 101450 }, { "epoch": 1.1, "learning_rate": 0.0001354738275929169, "loss": 0.0105, "step": 101460 }, { "epoch": 1.1, "learning_rate": 0.000135457611727314, "loss": 0.0093, "step": 101470 }, { "epoch": 1.1, "learning_rate": 0.0001354413958617111, "loss": 0.0106, "step": 101480 }, { "epoch": 1.1, "learning_rate": 0.00013542517999610819, "loss": 0.0093, "step": 101490 }, { "epoch": 1.1, "learning_rate": 0.00013540896413050528, "loss": 0.0102, "step": 101500 }, { "epoch": 1.1, "learning_rate": 0.00013539274826490237, "loss": 0.0118, "step": 101510 }, { "epoch": 1.1, "learning_rate": 0.00013537653239929946, "loss": 0.0085, "step": 101520 }, { "epoch": 1.1, "learning_rate": 0.00013536031653369656, "loss": 0.0122, "step": 101530 }, { "epoch": 1.1, "learning_rate": 0.00013534410066809365, "loss": 0.0094, "step": 101540 }, { "epoch": 1.1, "learning_rate": 0.00013532788480249074, "loss": 0.0105, "step": 101550 }, { "epoch": 1.1, "learning_rate": 0.00013531166893688784, "loss": 0.0123, "step": 101560 }, { "epoch": 1.1, "learning_rate": 0.00013529545307128493, "loss": 0.0091, "step": 101570 }, { "epoch": 1.1, "learning_rate": 0.00013527923720568202, "loss": 0.0094, "step": 101580 }, { "epoch": 1.1, "learning_rate": 0.0001352630213400791, "loss": 0.01, "step": 101590 }, { "epoch": 1.1, "learning_rate": 0.00013524680547447623, "loss": 0.011, "step": 101600 }, { "epoch": 1.1, "learning_rate": 0.0001352305896088733, "loss": 0.0117, "step": 101610 }, { "epoch": 1.1, "learning_rate": 0.00013521437374327042, "loss": 0.0119, "step": 101620 }, { "epoch": 1.1, "learning_rate": 0.00013519815787766748, "loss": 0.0101, "step": 101630 }, { "epoch": 1.1, "learning_rate": 0.0001351819420120646, "loss": 0.0098, "step": 101640 }, { "epoch": 1.1, "learning_rate": 0.0001351657261464617, "loss": 0.0114, "step": 101650 }, { "epoch": 1.1, "learning_rate": 0.0001351495102808588, "loss": 0.0095, "step": 101660 }, { "epoch": 1.1, "learning_rate": 0.00013513329441525588, "loss": 0.0088, "step": 101670 }, { "epoch": 1.1, "learning_rate": 0.00013511707854965298, "loss": 0.0107, "step": 101680 }, { "epoch": 1.1, "learning_rate": 0.00013510086268405007, "loss": 0.011, "step": 101690 }, { "epoch": 1.1, "learning_rate": 0.00013508464681844716, "loss": 0.0107, "step": 101700 }, { "epoch": 1.1, "learning_rate": 0.00013506843095284425, "loss": 0.0108, "step": 101710 }, { "epoch": 1.1, "learning_rate": 0.00013505221508724135, "loss": 0.011, "step": 101720 }, { "epoch": 1.1, "learning_rate": 0.00013503599922163844, "loss": 0.0093, "step": 101730 }, { "epoch": 1.1, "learning_rate": 0.00013501978335603553, "loss": 0.0093, "step": 101740 }, { "epoch": 1.1, "learning_rate": 0.00013500356749043262, "loss": 0.0125, "step": 101750 }, { "epoch": 1.1, "learning_rate": 0.00013498735162482972, "loss": 0.0101, "step": 101760 }, { "epoch": 1.1, "learning_rate": 0.0001349711357592268, "loss": 0.0109, "step": 101770 }, { "epoch": 1.1, "learning_rate": 0.0001349549198936239, "loss": 0.0092, "step": 101780 }, { "epoch": 1.1, "learning_rate": 0.000134938704028021, "loss": 0.011, "step": 101790 }, { "epoch": 1.1, "learning_rate": 0.00013492248816241812, "loss": 0.0096, "step": 101800 }, { "epoch": 1.1, "learning_rate": 0.00013490627229681518, "loss": 0.0089, "step": 101810 }, { "epoch": 1.1, "learning_rate": 0.0001348900564312123, "loss": 0.0124, "step": 101820 }, { "epoch": 1.1, "learning_rate": 0.00013487384056560937, "loss": 0.0116, "step": 101830 }, { "epoch": 1.1, "learning_rate": 0.00013485762470000649, "loss": 0.0113, "step": 101840 }, { "epoch": 1.1, "learning_rate": 0.00013484140883440355, "loss": 0.0127, "step": 101850 }, { "epoch": 1.1, "learning_rate": 0.00013482519296880067, "loss": 0.0101, "step": 101860 }, { "epoch": 1.1, "learning_rate": 0.00013480897710319776, "loss": 0.0088, "step": 101870 }, { "epoch": 1.1, "learning_rate": 0.00013479276123759486, "loss": 0.0096, "step": 101880 }, { "epoch": 1.1, "learning_rate": 0.00013477654537199195, "loss": 0.0098, "step": 101890 }, { "epoch": 1.1, "learning_rate": 0.00013476032950638904, "loss": 0.0101, "step": 101900 }, { "epoch": 1.1, "learning_rate": 0.00013474411364078614, "loss": 0.0137, "step": 101910 }, { "epoch": 1.1, "learning_rate": 0.00013472789777518323, "loss": 0.0133, "step": 101920 }, { "epoch": 1.1, "learning_rate": 0.00013471168190958032, "loss": 0.0084, "step": 101930 }, { "epoch": 1.1, "learning_rate": 0.00013469546604397741, "loss": 0.0119, "step": 101940 }, { "epoch": 1.1, "learning_rate": 0.0001346792501783745, "loss": 0.0107, "step": 101950 }, { "epoch": 1.1, "learning_rate": 0.0001346630343127716, "loss": 0.0084, "step": 101960 }, { "epoch": 1.1, "learning_rate": 0.0001346468184471687, "loss": 0.0083, "step": 101970 }, { "epoch": 1.1, "learning_rate": 0.00013463060258156578, "loss": 0.0089, "step": 101980 }, { "epoch": 1.1, "learning_rate": 0.00013461438671596288, "loss": 0.0114, "step": 101990 }, { "epoch": 1.1, "learning_rate": 0.00013459817085035997, "loss": 0.0085, "step": 102000 }, { "epoch": 1.1, "eval_cer": 0.921579050686457, "eval_loss": 0.008401263505220413, "eval_runtime": 121.0675, "eval_samples_per_second": 16.52, "eval_steps_per_second": 4.13, "step": 102000 }, { "epoch": 1.1, "learning_rate": 0.00013458195498475706, "loss": 0.0115, "step": 102010 }, { "epoch": 1.1, "learning_rate": 0.00013456573911915418, "loss": 0.0114, "step": 102020 }, { "epoch": 1.1, "learning_rate": 0.00013454952325355125, "loss": 0.0119, "step": 102030 }, { "epoch": 1.1, "learning_rate": 0.00013453330738794837, "loss": 0.0092, "step": 102040 }, { "epoch": 1.1, "learning_rate": 0.00013451709152234543, "loss": 0.0091, "step": 102050 }, { "epoch": 1.1, "learning_rate": 0.00013450087565674255, "loss": 0.0131, "step": 102060 }, { "epoch": 1.1, "learning_rate": 0.00013448465979113962, "loss": 0.0104, "step": 102070 }, { "epoch": 1.1, "learning_rate": 0.00013446844392553674, "loss": 0.0109, "step": 102080 }, { "epoch": 1.1, "learning_rate": 0.00013445222805993383, "loss": 0.0117, "step": 102090 }, { "epoch": 1.1, "learning_rate": 0.00013443601219433092, "loss": 0.0114, "step": 102100 }, { "epoch": 1.1, "learning_rate": 0.00013441979632872802, "loss": 0.0089, "step": 102110 }, { "epoch": 1.1, "learning_rate": 0.0001344035804631251, "loss": 0.0097, "step": 102120 }, { "epoch": 1.1, "learning_rate": 0.0001343873645975222, "loss": 0.0097, "step": 102130 }, { "epoch": 1.1, "learning_rate": 0.0001343711487319193, "loss": 0.0088, "step": 102140 }, { "epoch": 1.1, "learning_rate": 0.0001343549328663164, "loss": 0.0104, "step": 102150 }, { "epoch": 1.1, "learning_rate": 0.00013433871700071348, "loss": 0.0088, "step": 102160 }, { "epoch": 1.1, "learning_rate": 0.0001343225011351106, "loss": 0.0109, "step": 102170 }, { "epoch": 1.1, "learning_rate": 0.00013430628526950767, "loss": 0.008, "step": 102180 }, { "epoch": 1.1, "learning_rate": 0.0001342900694039048, "loss": 0.0096, "step": 102190 }, { "epoch": 1.1, "learning_rate": 0.00013427385353830185, "loss": 0.0107, "step": 102200 }, { "epoch": 1.1, "learning_rate": 0.00013425763767269897, "loss": 0.0103, "step": 102210 }, { "epoch": 1.11, "learning_rate": 0.00013424142180709604, "loss": 0.009, "step": 102220 }, { "epoch": 1.11, "learning_rate": 0.00013422520594149316, "loss": 0.0138, "step": 102230 }, { "epoch": 1.11, "learning_rate": 0.00013420899007589025, "loss": 0.01, "step": 102240 }, { "epoch": 1.11, "learning_rate": 0.00013419277421028734, "loss": 0.0147, "step": 102250 }, { "epoch": 1.11, "learning_rate": 0.00013417655834468444, "loss": 0.0104, "step": 102260 }, { "epoch": 1.11, "learning_rate": 0.00013416034247908153, "loss": 0.01, "step": 102270 }, { "epoch": 1.11, "learning_rate": 0.00013414412661347862, "loss": 0.0103, "step": 102280 }, { "epoch": 1.11, "learning_rate": 0.00013412791074787571, "loss": 0.0114, "step": 102290 }, { "epoch": 1.11, "learning_rate": 0.0001341116948822728, "loss": 0.0122, "step": 102300 }, { "epoch": 1.11, "learning_rate": 0.0001340954790166699, "loss": 0.0108, "step": 102310 }, { "epoch": 1.11, "learning_rate": 0.000134079263151067, "loss": 0.0098, "step": 102320 }, { "epoch": 1.11, "learning_rate": 0.00013406304728546408, "loss": 0.01, "step": 102330 }, { "epoch": 1.11, "learning_rate": 0.00013404683141986118, "loss": 0.009, "step": 102340 }, { "epoch": 1.11, "learning_rate": 0.00013403061555425827, "loss": 0.009, "step": 102350 }, { "epoch": 1.11, "learning_rate": 0.00013401439968865536, "loss": 0.0124, "step": 102360 }, { "epoch": 1.11, "learning_rate": 0.00013399818382305246, "loss": 0.0087, "step": 102370 }, { "epoch": 1.11, "learning_rate": 0.00013398196795744955, "loss": 0.0117, "step": 102380 }, { "epoch": 1.11, "learning_rate": 0.00013396575209184667, "loss": 0.0097, "step": 102390 }, { "epoch": 1.11, "learning_rate": 0.00013394953622624373, "loss": 0.0145, "step": 102400 }, { "epoch": 1.11, "learning_rate": 0.00013393332036064085, "loss": 0.0117, "step": 102410 }, { "epoch": 1.11, "learning_rate": 0.00013391710449503792, "loss": 0.012, "step": 102420 }, { "epoch": 1.11, "learning_rate": 0.00013390088862943504, "loss": 0.0107, "step": 102430 }, { "epoch": 1.11, "learning_rate": 0.0001338846727638321, "loss": 0.0107, "step": 102440 }, { "epoch": 1.11, "learning_rate": 0.00013386845689822922, "loss": 0.0098, "step": 102450 }, { "epoch": 1.11, "learning_rate": 0.00013385224103262632, "loss": 0.0106, "step": 102460 }, { "epoch": 1.11, "learning_rate": 0.0001338360251670234, "loss": 0.0089, "step": 102470 }, { "epoch": 1.11, "learning_rate": 0.0001338198093014205, "loss": 0.0096, "step": 102480 }, { "epoch": 1.11, "learning_rate": 0.0001338035934358176, "loss": 0.0109, "step": 102490 }, { "epoch": 1.11, "learning_rate": 0.0001337873775702147, "loss": 0.0132, "step": 102500 }, { "epoch": 1.11, "learning_rate": 0.00013377116170461178, "loss": 0.0096, "step": 102510 }, { "epoch": 1.11, "learning_rate": 0.00013375494583900887, "loss": 0.0123, "step": 102520 }, { "epoch": 1.11, "learning_rate": 0.00013373872997340597, "loss": 0.0084, "step": 102530 }, { "epoch": 1.11, "learning_rate": 0.00013372251410780306, "loss": 0.008, "step": 102540 }, { "epoch": 1.11, "learning_rate": 0.00013370629824220015, "loss": 0.0101, "step": 102550 }, { "epoch": 1.11, "learning_rate": 0.00013369008237659725, "loss": 0.0106, "step": 102560 }, { "epoch": 1.11, "learning_rate": 0.00013367386651099434, "loss": 0.0115, "step": 102570 }, { "epoch": 1.11, "learning_rate": 0.00013365765064539143, "loss": 0.0121, "step": 102580 }, { "epoch": 1.11, "learning_rate": 0.00013364143477978852, "loss": 0.0095, "step": 102590 }, { "epoch": 1.11, "learning_rate": 0.00013362521891418562, "loss": 0.0097, "step": 102600 }, { "epoch": 1.11, "learning_rate": 0.00013360900304858274, "loss": 0.0103, "step": 102610 }, { "epoch": 1.11, "learning_rate": 0.0001335927871829798, "loss": 0.0109, "step": 102620 }, { "epoch": 1.11, "learning_rate": 0.00013357657131737692, "loss": 0.0113, "step": 102630 }, { "epoch": 1.11, "learning_rate": 0.000133560355451774, "loss": 0.0098, "step": 102640 }, { "epoch": 1.11, "learning_rate": 0.0001335441395861711, "loss": 0.0116, "step": 102650 }, { "epoch": 1.11, "learning_rate": 0.0001335279237205682, "loss": 0.0096, "step": 102660 }, { "epoch": 1.11, "learning_rate": 0.0001335117078549653, "loss": 0.0085, "step": 102670 }, { "epoch": 1.11, "learning_rate": 0.00013349549198936239, "loss": 0.0084, "step": 102680 }, { "epoch": 1.11, "learning_rate": 0.00013347927612375948, "loss": 0.0094, "step": 102690 }, { "epoch": 1.11, "learning_rate": 0.00013346306025815657, "loss": 0.0122, "step": 102700 }, { "epoch": 1.11, "learning_rate": 0.00013344684439255366, "loss": 0.0109, "step": 102710 }, { "epoch": 1.11, "learning_rate": 0.00013343062852695076, "loss": 0.0121, "step": 102720 }, { "epoch": 1.11, "learning_rate": 0.00013341441266134785, "loss": 0.0124, "step": 102730 }, { "epoch": 1.11, "learning_rate": 0.00013339819679574494, "loss": 0.0132, "step": 102740 }, { "epoch": 1.11, "learning_rate": 0.00013338198093014203, "loss": 0.0093, "step": 102750 }, { "epoch": 1.11, "learning_rate": 0.00013336576506453913, "loss": 0.0106, "step": 102760 }, { "epoch": 1.11, "learning_rate": 0.00013334954919893622, "loss": 0.0107, "step": 102770 }, { "epoch": 1.11, "learning_rate": 0.0001333333333333333, "loss": 0.0134, "step": 102780 }, { "epoch": 1.11, "learning_rate": 0.0001333171174677304, "loss": 0.0084, "step": 102790 }, { "epoch": 1.11, "learning_rate": 0.0001333009016021275, "loss": 0.0118, "step": 102800 }, { "epoch": 1.11, "learning_rate": 0.00013328468573652462, "loss": 0.0088, "step": 102810 }, { "epoch": 1.11, "learning_rate": 0.00013326846987092168, "loss": 0.0089, "step": 102820 }, { "epoch": 1.11, "learning_rate": 0.0001332522540053188, "loss": 0.0113, "step": 102830 }, { "epoch": 1.11, "learning_rate": 0.00013323603813971587, "loss": 0.0097, "step": 102840 }, { "epoch": 1.11, "learning_rate": 0.000133219822274113, "loss": 0.0117, "step": 102850 }, { "epoch": 1.11, "learning_rate": 0.00013320360640851008, "loss": 0.0095, "step": 102860 }, { "epoch": 1.11, "learning_rate": 0.00013318739054290717, "loss": 0.0101, "step": 102870 }, { "epoch": 1.11, "learning_rate": 0.00013317117467730427, "loss": 0.0103, "step": 102880 }, { "epoch": 1.11, "learning_rate": 0.00013315495881170136, "loss": 0.0115, "step": 102890 }, { "epoch": 1.11, "learning_rate": 0.00013313874294609845, "loss": 0.0116, "step": 102900 }, { "epoch": 1.11, "learning_rate": 0.00013312252708049555, "loss": 0.012, "step": 102910 }, { "epoch": 1.11, "learning_rate": 0.00013310631121489264, "loss": 0.0103, "step": 102920 }, { "epoch": 1.11, "learning_rate": 0.00013309009534928973, "loss": 0.0126, "step": 102930 }, { "epoch": 1.11, "learning_rate": 0.00013307387948368682, "loss": 0.0103, "step": 102940 }, { "epoch": 1.11, "learning_rate": 0.00013305766361808392, "loss": 0.0118, "step": 102950 }, { "epoch": 1.11, "learning_rate": 0.00013304144775248104, "loss": 0.0104, "step": 102960 }, { "epoch": 1.11, "learning_rate": 0.0001330252318868781, "loss": 0.0122, "step": 102970 }, { "epoch": 1.11, "learning_rate": 0.00013300901602127522, "loss": 0.0093, "step": 102980 }, { "epoch": 1.11, "learning_rate": 0.0001329928001556723, "loss": 0.0089, "step": 102990 }, { "epoch": 1.11, "learning_rate": 0.0001329765842900694, "loss": 0.0123, "step": 103000 }, { "epoch": 1.11, "eval_cer": 0.921526065906118, "eval_loss": 0.008482340723276138, "eval_runtime": 121.2993, "eval_samples_per_second": 16.488, "eval_steps_per_second": 4.122, "step": 103000 }, { "epoch": 1.11, "learning_rate": 0.00013296036842446647, "loss": 0.0106, "step": 103010 }, { "epoch": 1.11, "learning_rate": 0.0001329441525588636, "loss": 0.0092, "step": 103020 }, { "epoch": 1.11, "learning_rate": 0.00013292793669326069, "loss": 0.011, "step": 103030 }, { "epoch": 1.11, "learning_rate": 0.00013291172082765778, "loss": 0.0089, "step": 103040 }, { "epoch": 1.11, "learning_rate": 0.00013289550496205487, "loss": 0.012, "step": 103050 }, { "epoch": 1.11, "learning_rate": 0.00013287928909645196, "loss": 0.0099, "step": 103060 }, { "epoch": 1.11, "learning_rate": 0.00013286307323084906, "loss": 0.0084, "step": 103070 }, { "epoch": 1.11, "learning_rate": 0.00013284685736524615, "loss": 0.0081, "step": 103080 }, { "epoch": 1.11, "learning_rate": 0.00013283064149964324, "loss": 0.0119, "step": 103090 }, { "epoch": 1.11, "learning_rate": 0.00013281442563404033, "loss": 0.0123, "step": 103100 }, { "epoch": 1.11, "learning_rate": 0.00013279820976843743, "loss": 0.0105, "step": 103110 }, { "epoch": 1.11, "learning_rate": 0.00013278199390283452, "loss": 0.0124, "step": 103120 }, { "epoch": 1.11, "learning_rate": 0.0001327657780372316, "loss": 0.0098, "step": 103130 }, { "epoch": 1.11, "learning_rate": 0.0001327495621716287, "loss": 0.0104, "step": 103140 }, { "epoch": 1.12, "learning_rate": 0.0001327333463060258, "loss": 0.009, "step": 103150 }, { "epoch": 1.12, "learning_rate": 0.0001327171304404229, "loss": 0.0119, "step": 103160 }, { "epoch": 1.12, "learning_rate": 0.00013270091457481998, "loss": 0.0097, "step": 103170 }, { "epoch": 1.12, "learning_rate": 0.0001326846987092171, "loss": 0.0092, "step": 103180 }, { "epoch": 1.12, "learning_rate": 0.00013266848284361417, "loss": 0.0091, "step": 103190 }, { "epoch": 1.12, "learning_rate": 0.0001326522669780113, "loss": 0.0101, "step": 103200 }, { "epoch": 1.12, "learning_rate": 0.00013263605111240835, "loss": 0.0109, "step": 103210 }, { "epoch": 1.12, "learning_rate": 0.00013261983524680547, "loss": 0.0105, "step": 103220 }, { "epoch": 1.12, "learning_rate": 0.00013260361938120254, "loss": 0.0092, "step": 103230 }, { "epoch": 1.12, "learning_rate": 0.00013258740351559966, "loss": 0.0104, "step": 103240 }, { "epoch": 1.12, "learning_rate": 0.00013257118764999675, "loss": 0.0119, "step": 103250 }, { "epoch": 1.12, "learning_rate": 0.00013255497178439385, "loss": 0.0128, "step": 103260 }, { "epoch": 1.12, "learning_rate": 0.00013253875591879094, "loss": 0.0096, "step": 103270 }, { "epoch": 1.12, "learning_rate": 0.00013252254005318803, "loss": 0.0102, "step": 103280 }, { "epoch": 1.12, "learning_rate": 0.00013250632418758512, "loss": 0.0129, "step": 103290 }, { "epoch": 1.12, "learning_rate": 0.00013249010832198222, "loss": 0.0107, "step": 103300 }, { "epoch": 1.12, "learning_rate": 0.0001324738924563793, "loss": 0.0114, "step": 103310 }, { "epoch": 1.12, "learning_rate": 0.0001324576765907764, "loss": 0.0107, "step": 103320 }, { "epoch": 1.12, "learning_rate": 0.0001324414607251735, "loss": 0.0106, "step": 103330 }, { "epoch": 1.12, "learning_rate": 0.0001324252448595706, "loss": 0.0096, "step": 103340 }, { "epoch": 1.12, "learning_rate": 0.00013240902899396768, "loss": 0.0099, "step": 103350 }, { "epoch": 1.12, "learning_rate": 0.00013239281312836477, "loss": 0.0106, "step": 103360 }, { "epoch": 1.12, "learning_rate": 0.00013237659726276187, "loss": 0.0097, "step": 103370 }, { "epoch": 1.12, "learning_rate": 0.00013236038139715896, "loss": 0.01, "step": 103380 }, { "epoch": 1.12, "learning_rate": 0.00013234416553155605, "loss": 0.009, "step": 103390 }, { "epoch": 1.12, "learning_rate": 0.00013232794966595317, "loss": 0.0102, "step": 103400 }, { "epoch": 1.12, "learning_rate": 0.00013231173380035024, "loss": 0.0127, "step": 103410 }, { "epoch": 1.12, "learning_rate": 0.00013229551793474736, "loss": 0.0092, "step": 103420 }, { "epoch": 1.12, "learning_rate": 0.00013227930206914442, "loss": 0.0101, "step": 103430 }, { "epoch": 1.12, "learning_rate": 0.00013226308620354154, "loss": 0.0148, "step": 103440 }, { "epoch": 1.12, "learning_rate": 0.0001322468703379386, "loss": 0.0105, "step": 103450 }, { "epoch": 1.12, "learning_rate": 0.00013223065447233573, "loss": 0.0141, "step": 103460 }, { "epoch": 1.12, "learning_rate": 0.00013221443860673282, "loss": 0.0117, "step": 103470 }, { "epoch": 1.12, "learning_rate": 0.0001321982227411299, "loss": 0.0099, "step": 103480 }, { "epoch": 1.12, "learning_rate": 0.000132182006875527, "loss": 0.0118, "step": 103490 }, { "epoch": 1.12, "learning_rate": 0.0001321657910099241, "loss": 0.0105, "step": 103500 }, { "epoch": 1.12, "learning_rate": 0.0001321495751443212, "loss": 0.0129, "step": 103510 }, { "epoch": 1.12, "learning_rate": 0.00013213335927871828, "loss": 0.0125, "step": 103520 }, { "epoch": 1.12, "learning_rate": 0.00013211714341311538, "loss": 0.0136, "step": 103530 }, { "epoch": 1.12, "learning_rate": 0.00013210092754751247, "loss": 0.0127, "step": 103540 }, { "epoch": 1.12, "learning_rate": 0.00013208471168190956, "loss": 0.0111, "step": 103550 }, { "epoch": 1.12, "learning_rate": 0.00013206849581630666, "loss": 0.01, "step": 103560 }, { "epoch": 1.12, "learning_rate": 0.00013205227995070375, "loss": 0.0129, "step": 103570 }, { "epoch": 1.12, "learning_rate": 0.00013203606408510084, "loss": 0.0123, "step": 103580 }, { "epoch": 1.12, "learning_rate": 0.00013201984821949796, "loss": 0.0104, "step": 103590 }, { "epoch": 1.12, "learning_rate": 0.00013200363235389503, "loss": 0.0097, "step": 103600 }, { "epoch": 1.12, "learning_rate": 0.00013198741648829215, "loss": 0.0122, "step": 103610 }, { "epoch": 1.12, "learning_rate": 0.00013197120062268924, "loss": 0.0077, "step": 103620 }, { "epoch": 1.12, "learning_rate": 0.00013195498475708633, "loss": 0.0142, "step": 103630 }, { "epoch": 1.12, "learning_rate": 0.00013193876889148342, "loss": 0.0117, "step": 103640 }, { "epoch": 1.12, "learning_rate": 0.00013192255302588052, "loss": 0.0101, "step": 103650 }, { "epoch": 1.12, "learning_rate": 0.0001319063371602776, "loss": 0.0137, "step": 103660 }, { "epoch": 1.12, "learning_rate": 0.0001318901212946747, "loss": 0.0092, "step": 103670 }, { "epoch": 1.12, "learning_rate": 0.0001318739054290718, "loss": 0.0107, "step": 103680 }, { "epoch": 1.12, "learning_rate": 0.0001318576895634689, "loss": 0.0102, "step": 103690 }, { "epoch": 1.12, "learning_rate": 0.00013184147369786598, "loss": 0.0103, "step": 103700 }, { "epoch": 1.12, "learning_rate": 0.00013182525783226307, "loss": 0.0092, "step": 103710 }, { "epoch": 1.12, "learning_rate": 0.00013180904196666017, "loss": 0.0132, "step": 103720 }, { "epoch": 1.12, "learning_rate": 0.00013179282610105726, "loss": 0.0093, "step": 103730 }, { "epoch": 1.12, "learning_rate": 0.00013177661023545435, "loss": 0.0099, "step": 103740 }, { "epoch": 1.12, "learning_rate": 0.00013176039436985144, "loss": 0.0102, "step": 103750 }, { "epoch": 1.12, "learning_rate": 0.00013174417850424854, "loss": 0.0115, "step": 103760 }, { "epoch": 1.12, "learning_rate": 0.00013172796263864566, "loss": 0.0122, "step": 103770 }, { "epoch": 1.12, "learning_rate": 0.00013171174677304272, "loss": 0.0092, "step": 103780 }, { "epoch": 1.12, "learning_rate": 0.00013169553090743984, "loss": 0.0086, "step": 103790 }, { "epoch": 1.12, "learning_rate": 0.0001316793150418369, "loss": 0.0102, "step": 103800 }, { "epoch": 1.12, "learning_rate": 0.00013166309917623403, "loss": 0.0099, "step": 103810 }, { "epoch": 1.12, "learning_rate": 0.00013164688331063112, "loss": 0.0078, "step": 103820 }, { "epoch": 1.12, "learning_rate": 0.0001316306674450282, "loss": 0.0087, "step": 103830 }, { "epoch": 1.12, "learning_rate": 0.0001316144515794253, "loss": 0.0095, "step": 103840 }, { "epoch": 1.12, "learning_rate": 0.0001315982357138224, "loss": 0.0099, "step": 103850 }, { "epoch": 1.12, "learning_rate": 0.0001315820198482195, "loss": 0.0114, "step": 103860 }, { "epoch": 1.12, "learning_rate": 0.00013156580398261658, "loss": 0.0091, "step": 103870 }, { "epoch": 1.12, "learning_rate": 0.00013154958811701368, "loss": 0.0117, "step": 103880 }, { "epoch": 1.12, "learning_rate": 0.00013153337225141077, "loss": 0.0112, "step": 103890 }, { "epoch": 1.12, "learning_rate": 0.00013151715638580786, "loss": 0.0115, "step": 103900 }, { "epoch": 1.12, "learning_rate": 0.00013150094052020496, "loss": 0.0087, "step": 103910 }, { "epoch": 1.12, "learning_rate": 0.00013148472465460205, "loss": 0.0103, "step": 103920 }, { "epoch": 1.12, "learning_rate": 0.00013146850878899914, "loss": 0.0123, "step": 103930 }, { "epoch": 1.12, "learning_rate": 0.00013145229292339623, "loss": 0.0103, "step": 103940 }, { "epoch": 1.12, "learning_rate": 0.00013143607705779333, "loss": 0.0111, "step": 103950 }, { "epoch": 1.12, "learning_rate": 0.00013141986119219042, "loss": 0.0105, "step": 103960 }, { "epoch": 1.12, "learning_rate": 0.00013140364532658754, "loss": 0.0101, "step": 103970 }, { "epoch": 1.12, "learning_rate": 0.0001313874294609846, "loss": 0.0097, "step": 103980 }, { "epoch": 1.12, "learning_rate": 0.00013137121359538172, "loss": 0.0108, "step": 103990 }, { "epoch": 1.12, "learning_rate": 0.0001313549977297788, "loss": 0.0094, "step": 104000 }, { "epoch": 1.12, "eval_cer": 0.9215208542883797, "eval_loss": 0.008366812020540237, "eval_runtime": 121.4656, "eval_samples_per_second": 16.466, "eval_steps_per_second": 4.116, "step": 104000 }, { "epoch": 1.12, "learning_rate": 0.0001313387818641759, "loss": 0.0098, "step": 104010 }, { "epoch": 1.12, "learning_rate": 0.00013132256599857298, "loss": 0.0102, "step": 104020 }, { "epoch": 1.12, "learning_rate": 0.0001313063501329701, "loss": 0.0107, "step": 104030 }, { "epoch": 1.12, "learning_rate": 0.0001312901342673672, "loss": 0.012, "step": 104040 }, { "epoch": 1.12, "learning_rate": 0.00013127391840176428, "loss": 0.0161, "step": 104050 }, { "epoch": 1.12, "learning_rate": 0.00013125770253616137, "loss": 0.0099, "step": 104060 }, { "epoch": 1.13, "learning_rate": 0.00013124148667055847, "loss": 0.0086, "step": 104070 }, { "epoch": 1.13, "learning_rate": 0.00013122527080495556, "loss": 0.0093, "step": 104080 }, { "epoch": 1.13, "learning_rate": 0.00013120905493935265, "loss": 0.0101, "step": 104090 }, { "epoch": 1.13, "learning_rate": 0.00013119283907374974, "loss": 0.0121, "step": 104100 }, { "epoch": 1.13, "learning_rate": 0.00013117662320814684, "loss": 0.0119, "step": 104110 }, { "epoch": 1.13, "learning_rate": 0.00013116040734254393, "loss": 0.0087, "step": 104120 }, { "epoch": 1.13, "learning_rate": 0.00013114419147694102, "loss": 0.012, "step": 104130 }, { "epoch": 1.13, "learning_rate": 0.00013112797561133812, "loss": 0.0112, "step": 104140 }, { "epoch": 1.13, "learning_rate": 0.0001311117597457352, "loss": 0.0094, "step": 104150 }, { "epoch": 1.13, "learning_rate": 0.0001310955438801323, "loss": 0.0144, "step": 104160 }, { "epoch": 1.13, "learning_rate": 0.0001310793280145294, "loss": 0.0104, "step": 104170 }, { "epoch": 1.13, "learning_rate": 0.00013106311214892649, "loss": 0.0109, "step": 104180 }, { "epoch": 1.13, "learning_rate": 0.0001310468962833236, "loss": 0.0085, "step": 104190 }, { "epoch": 1.13, "learning_rate": 0.00013103068041772067, "loss": 0.0111, "step": 104200 }, { "epoch": 1.13, "learning_rate": 0.0001310144645521178, "loss": 0.0079, "step": 104210 }, { "epoch": 1.13, "learning_rate": 0.00013099824868651486, "loss": 0.0111, "step": 104220 }, { "epoch": 1.13, "learning_rate": 0.00013098203282091198, "loss": 0.0089, "step": 104230 }, { "epoch": 1.13, "learning_rate": 0.00013096581695530904, "loss": 0.0078, "step": 104240 }, { "epoch": 1.13, "learning_rate": 0.00013094960108970616, "loss": 0.0094, "step": 104250 }, { "epoch": 1.13, "learning_rate": 0.00013093338522410326, "loss": 0.0089, "step": 104260 }, { "epoch": 1.13, "learning_rate": 0.00013091716935850035, "loss": 0.0109, "step": 104270 }, { "epoch": 1.13, "learning_rate": 0.00013090095349289744, "loss": 0.0085, "step": 104280 }, { "epoch": 1.13, "learning_rate": 0.00013088473762729453, "loss": 0.0082, "step": 104290 }, { "epoch": 1.13, "learning_rate": 0.00013086852176169163, "loss": 0.0098, "step": 104300 }, { "epoch": 1.13, "learning_rate": 0.00013085230589608872, "loss": 0.0076, "step": 104310 }, { "epoch": 1.13, "learning_rate": 0.0001308360900304858, "loss": 0.0107, "step": 104320 }, { "epoch": 1.13, "learning_rate": 0.0001308198741648829, "loss": 0.0101, "step": 104330 }, { "epoch": 1.13, "learning_rate": 0.00013080365829928002, "loss": 0.0104, "step": 104340 }, { "epoch": 1.13, "learning_rate": 0.0001307874424336771, "loss": 0.0093, "step": 104350 }, { "epoch": 1.13, "learning_rate": 0.0001307712265680742, "loss": 0.0115, "step": 104360 }, { "epoch": 1.13, "learning_rate": 0.00013075501070247128, "loss": 0.0092, "step": 104370 }, { "epoch": 1.13, "learning_rate": 0.0001307387948368684, "loss": 0.0113, "step": 104380 }, { "epoch": 1.13, "learning_rate": 0.00013072257897126546, "loss": 0.0111, "step": 104390 }, { "epoch": 1.13, "learning_rate": 0.00013070636310566258, "loss": 0.0128, "step": 104400 }, { "epoch": 1.13, "learning_rate": 0.00013069014724005967, "loss": 0.008, "step": 104410 }, { "epoch": 1.13, "learning_rate": 0.00013067393137445677, "loss": 0.0109, "step": 104420 }, { "epoch": 1.13, "learning_rate": 0.00013065771550885386, "loss": 0.01, "step": 104430 }, { "epoch": 1.13, "learning_rate": 0.00013064149964325095, "loss": 0.01, "step": 104440 }, { "epoch": 1.13, "learning_rate": 0.00013062528377764804, "loss": 0.0109, "step": 104450 }, { "epoch": 1.13, "learning_rate": 0.00013060906791204514, "loss": 0.0107, "step": 104460 }, { "epoch": 1.13, "learning_rate": 0.00013059285204644223, "loss": 0.0121, "step": 104470 }, { "epoch": 1.13, "learning_rate": 0.00013057663618083932, "loss": 0.0101, "step": 104480 }, { "epoch": 1.13, "learning_rate": 0.00013056042031523642, "loss": 0.0132, "step": 104490 }, { "epoch": 1.13, "learning_rate": 0.0001305442044496335, "loss": 0.0114, "step": 104500 }, { "epoch": 1.13, "learning_rate": 0.0001305279885840306, "loss": 0.0091, "step": 104510 }, { "epoch": 1.13, "learning_rate": 0.0001305117727184277, "loss": 0.0104, "step": 104520 }, { "epoch": 1.13, "learning_rate": 0.0001304955568528248, "loss": 0.0088, "step": 104530 }, { "epoch": 1.13, "learning_rate": 0.00013047934098722188, "loss": 0.0093, "step": 104540 }, { "epoch": 1.13, "learning_rate": 0.00013046312512161897, "loss": 0.0129, "step": 104550 }, { "epoch": 1.13, "learning_rate": 0.0001304469092560161, "loss": 0.0089, "step": 104560 }, { "epoch": 1.13, "learning_rate": 0.00013043069339041316, "loss": 0.01, "step": 104570 }, { "epoch": 1.13, "learning_rate": 0.00013041447752481028, "loss": 0.0114, "step": 104580 }, { "epoch": 1.13, "learning_rate": 0.00013039826165920734, "loss": 0.0095, "step": 104590 }, { "epoch": 1.13, "learning_rate": 0.00013038204579360446, "loss": 0.0125, "step": 104600 }, { "epoch": 1.13, "learning_rate": 0.00013036582992800153, "loss": 0.0105, "step": 104610 }, { "epoch": 1.13, "learning_rate": 0.00013034961406239865, "loss": 0.0135, "step": 104620 }, { "epoch": 1.13, "learning_rate": 0.00013033339819679574, "loss": 0.0107, "step": 104630 }, { "epoch": 1.13, "learning_rate": 0.00013031718233119283, "loss": 0.0112, "step": 104640 }, { "epoch": 1.13, "learning_rate": 0.00013030096646558993, "loss": 0.0124, "step": 104650 }, { "epoch": 1.13, "learning_rate": 0.00013028475059998702, "loss": 0.0093, "step": 104660 }, { "epoch": 1.13, "learning_rate": 0.0001302685347343841, "loss": 0.0098, "step": 104670 }, { "epoch": 1.13, "learning_rate": 0.0001302523188687812, "loss": 0.0094, "step": 104680 }, { "epoch": 1.13, "learning_rate": 0.0001302361030031783, "loss": 0.009, "step": 104690 }, { "epoch": 1.13, "learning_rate": 0.0001302198871375754, "loss": 0.0099, "step": 104700 }, { "epoch": 1.13, "learning_rate": 0.00013020367127197248, "loss": 0.012, "step": 104710 }, { "epoch": 1.13, "learning_rate": 0.00013018745540636958, "loss": 0.0083, "step": 104720 }, { "epoch": 1.13, "learning_rate": 0.00013017123954076667, "loss": 0.0092, "step": 104730 }, { "epoch": 1.13, "learning_rate": 0.00013015502367516376, "loss": 0.0143, "step": 104740 }, { "epoch": 1.13, "learning_rate": 0.00013013880780956085, "loss": 0.0118, "step": 104750 }, { "epoch": 1.13, "learning_rate": 0.00013012259194395795, "loss": 0.012, "step": 104760 }, { "epoch": 1.13, "learning_rate": 0.00013010637607835504, "loss": 0.0103, "step": 104770 }, { "epoch": 1.13, "learning_rate": 0.00013009016021275216, "loss": 0.013, "step": 104780 }, { "epoch": 1.13, "learning_rate": 0.00013007394434714923, "loss": 0.0131, "step": 104790 }, { "epoch": 1.13, "learning_rate": 0.00013005772848154634, "loss": 0.0115, "step": 104800 }, { "epoch": 1.13, "learning_rate": 0.0001300415126159434, "loss": 0.0109, "step": 104810 }, { "epoch": 1.13, "learning_rate": 0.00013002529675034053, "loss": 0.012, "step": 104820 }, { "epoch": 1.13, "learning_rate": 0.00013000908088473762, "loss": 0.012, "step": 104830 }, { "epoch": 1.13, "learning_rate": 0.00012999286501913472, "loss": 0.0103, "step": 104840 }, { "epoch": 1.13, "learning_rate": 0.0001299766491535318, "loss": 0.0133, "step": 104850 }, { "epoch": 1.13, "learning_rate": 0.0001299604332879289, "loss": 0.0111, "step": 104860 }, { "epoch": 1.13, "learning_rate": 0.000129944217422326, "loss": 0.0092, "step": 104870 }, { "epoch": 1.13, "learning_rate": 0.0001299280015567231, "loss": 0.009, "step": 104880 }, { "epoch": 1.13, "learning_rate": 0.00012991178569112018, "loss": 0.0112, "step": 104890 }, { "epoch": 1.13, "learning_rate": 0.00012989556982551727, "loss": 0.0102, "step": 104900 }, { "epoch": 1.13, "learning_rate": 0.00012987935395991437, "loss": 0.0114, "step": 104910 }, { "epoch": 1.13, "learning_rate": 0.00012986313809431146, "loss": 0.0099, "step": 104920 }, { "epoch": 1.13, "learning_rate": 0.00012984692222870855, "loss": 0.009, "step": 104930 }, { "epoch": 1.13, "learning_rate": 0.00012983070636310564, "loss": 0.0094, "step": 104940 }, { "epoch": 1.13, "learning_rate": 0.00012981449049750274, "loss": 0.0078, "step": 104950 }, { "epoch": 1.13, "learning_rate": 0.00012979827463189983, "loss": 0.0103, "step": 104960 }, { "epoch": 1.13, "learning_rate": 0.00012978205876629692, "loss": 0.0106, "step": 104970 }, { "epoch": 1.13, "learning_rate": 0.00012976584290069404, "loss": 0.0119, "step": 104980 }, { "epoch": 1.13, "learning_rate": 0.0001297496270350911, "loss": 0.0115, "step": 104990 }, { "epoch": 1.14, "learning_rate": 0.00012973341116948823, "loss": 0.0076, "step": 105000 }, { "epoch": 1.14, "eval_cer": 0.9215278031120306, "eval_loss": 0.008072057738900185, "eval_runtime": 121.1811, "eval_samples_per_second": 16.504, "eval_steps_per_second": 4.126, "step": 105000 }, { "epoch": 1.14, "learning_rate": 0.0001297171953038853, "loss": 0.0099, "step": 105010 }, { "epoch": 1.14, "learning_rate": 0.0001297009794382824, "loss": 0.0106, "step": 105020 }, { "epoch": 1.14, "learning_rate": 0.0001296847635726795, "loss": 0.0087, "step": 105030 }, { "epoch": 1.14, "learning_rate": 0.0001296685477070766, "loss": 0.0082, "step": 105040 }, { "epoch": 1.14, "learning_rate": 0.0001296523318414737, "loss": 0.013, "step": 105050 }, { "epoch": 1.14, "learning_rate": 0.00012963611597587078, "loss": 0.0091, "step": 105060 }, { "epoch": 1.14, "learning_rate": 0.00012961990011026788, "loss": 0.0111, "step": 105070 }, { "epoch": 1.14, "learning_rate": 0.00012960368424466497, "loss": 0.0113, "step": 105080 }, { "epoch": 1.14, "learning_rate": 0.00012958746837906206, "loss": 0.0119, "step": 105090 }, { "epoch": 1.14, "learning_rate": 0.00012957125251345915, "loss": 0.0094, "step": 105100 }, { "epoch": 1.14, "learning_rate": 0.00012955503664785625, "loss": 0.0095, "step": 105110 }, { "epoch": 1.14, "learning_rate": 0.00012953882078225334, "loss": 0.0122, "step": 105120 }, { "epoch": 1.14, "learning_rate": 0.00012952260491665046, "loss": 0.0088, "step": 105130 }, { "epoch": 1.14, "learning_rate": 0.00012950638905104753, "loss": 0.0088, "step": 105140 }, { "epoch": 1.14, "learning_rate": 0.00012949017318544465, "loss": 0.0083, "step": 105150 }, { "epoch": 1.14, "learning_rate": 0.0001294739573198417, "loss": 0.0109, "step": 105160 }, { "epoch": 1.14, "learning_rate": 0.00012945774145423883, "loss": 0.0116, "step": 105170 }, { "epoch": 1.14, "learning_rate": 0.0001294415255886359, "loss": 0.0094, "step": 105180 }, { "epoch": 1.14, "learning_rate": 0.00012942530972303302, "loss": 0.0097, "step": 105190 }, { "epoch": 1.14, "learning_rate": 0.0001294090938574301, "loss": 0.0106, "step": 105200 }, { "epoch": 1.14, "learning_rate": 0.0001293928779918272, "loss": 0.0104, "step": 105210 }, { "epoch": 1.14, "learning_rate": 0.0001293766621262243, "loss": 0.0097, "step": 105220 }, { "epoch": 1.14, "learning_rate": 0.0001293604462606214, "loss": 0.0102, "step": 105230 }, { "epoch": 1.14, "learning_rate": 0.00012934423039501848, "loss": 0.0102, "step": 105240 }, { "epoch": 1.14, "learning_rate": 0.00012932801452941557, "loss": 0.0111, "step": 105250 }, { "epoch": 1.14, "learning_rate": 0.00012931179866381267, "loss": 0.01, "step": 105260 }, { "epoch": 1.14, "learning_rate": 0.00012929558279820976, "loss": 0.0111, "step": 105270 }, { "epoch": 1.14, "learning_rate": 0.00012927936693260685, "loss": 0.0081, "step": 105280 }, { "epoch": 1.14, "learning_rate": 0.00012926315106700394, "loss": 0.0105, "step": 105290 }, { "epoch": 1.14, "learning_rate": 0.00012924693520140104, "loss": 0.0118, "step": 105300 }, { "epoch": 1.14, "learning_rate": 0.00012923071933579813, "loss": 0.0079, "step": 105310 }, { "epoch": 1.14, "learning_rate": 0.00012921450347019522, "loss": 0.0124, "step": 105320 }, { "epoch": 1.14, "learning_rate": 0.00012919828760459231, "loss": 0.01, "step": 105330 }, { "epoch": 1.14, "learning_rate": 0.0001291820717389894, "loss": 0.0109, "step": 105340 }, { "epoch": 1.14, "learning_rate": 0.00012916585587338653, "loss": 0.0094, "step": 105350 }, { "epoch": 1.14, "learning_rate": 0.0001291496400077836, "loss": 0.01, "step": 105360 }, { "epoch": 1.14, "learning_rate": 0.0001291334241421807, "loss": 0.0113, "step": 105370 }, { "epoch": 1.14, "learning_rate": 0.00012911720827657778, "loss": 0.0095, "step": 105380 }, { "epoch": 1.14, "learning_rate": 0.0001291009924109749, "loss": 0.0102, "step": 105390 }, { "epoch": 1.14, "learning_rate": 0.00012908477654537196, "loss": 0.0115, "step": 105400 }, { "epoch": 1.14, "learning_rate": 0.00012906856067976908, "loss": 0.0129, "step": 105410 }, { "epoch": 1.14, "learning_rate": 0.00012905234481416618, "loss": 0.0096, "step": 105420 }, { "epoch": 1.14, "learning_rate": 0.00012903612894856327, "loss": 0.011, "step": 105430 }, { "epoch": 1.14, "learning_rate": 0.00012901991308296036, "loss": 0.0087, "step": 105440 }, { "epoch": 1.14, "learning_rate": 0.00012900369721735745, "loss": 0.0097, "step": 105450 }, { "epoch": 1.14, "learning_rate": 0.00012898748135175455, "loss": 0.0109, "step": 105460 }, { "epoch": 1.14, "learning_rate": 0.00012897126548615164, "loss": 0.0101, "step": 105470 }, { "epoch": 1.14, "learning_rate": 0.00012895504962054873, "loss": 0.0084, "step": 105480 }, { "epoch": 1.14, "learning_rate": 0.00012893883375494583, "loss": 0.0113, "step": 105490 }, { "epoch": 1.14, "learning_rate": 0.00012892261788934292, "loss": 0.0087, "step": 105500 }, { "epoch": 1.14, "learning_rate": 0.00012890640202374, "loss": 0.0096, "step": 105510 }, { "epoch": 1.14, "learning_rate": 0.0001288901861581371, "loss": 0.0102, "step": 105520 }, { "epoch": 1.14, "learning_rate": 0.0001288739702925342, "loss": 0.0094, "step": 105530 }, { "epoch": 1.14, "learning_rate": 0.0001288577544269313, "loss": 0.0112, "step": 105540 }, { "epoch": 1.14, "learning_rate": 0.00012884153856132838, "loss": 0.0089, "step": 105550 }, { "epoch": 1.14, "learning_rate": 0.00012882532269572547, "loss": 0.0085, "step": 105560 }, { "epoch": 1.14, "learning_rate": 0.0001288091068301226, "loss": 0.0102, "step": 105570 }, { "epoch": 1.14, "learning_rate": 0.00012879289096451966, "loss": 0.0079, "step": 105580 }, { "epoch": 1.14, "learning_rate": 0.00012877667509891678, "loss": 0.0076, "step": 105590 }, { "epoch": 1.14, "learning_rate": 0.00012876045923331385, "loss": 0.0101, "step": 105600 }, { "epoch": 1.14, "learning_rate": 0.00012874424336771097, "loss": 0.009, "step": 105610 }, { "epoch": 1.14, "learning_rate": 0.00012872802750210803, "loss": 0.0078, "step": 105620 }, { "epoch": 1.14, "learning_rate": 0.00012871181163650515, "loss": 0.0096, "step": 105630 }, { "epoch": 1.14, "learning_rate": 0.00012869559577090224, "loss": 0.0092, "step": 105640 }, { "epoch": 1.14, "learning_rate": 0.00012867937990529934, "loss": 0.0084, "step": 105650 }, { "epoch": 1.14, "learning_rate": 0.00012866316403969643, "loss": 0.0088, "step": 105660 }, { "epoch": 1.14, "learning_rate": 0.00012864694817409352, "loss": 0.0094, "step": 105670 }, { "epoch": 1.14, "learning_rate": 0.00012863073230849061, "loss": 0.0108, "step": 105680 }, { "epoch": 1.14, "learning_rate": 0.0001286145164428877, "loss": 0.0102, "step": 105690 }, { "epoch": 1.14, "learning_rate": 0.0001285983005772848, "loss": 0.0075, "step": 105700 }, { "epoch": 1.14, "learning_rate": 0.0001285820847116819, "loss": 0.0109, "step": 105710 }, { "epoch": 1.14, "learning_rate": 0.00012856586884607899, "loss": 0.0087, "step": 105720 }, { "epoch": 1.14, "learning_rate": 0.00012854965298047608, "loss": 0.0092, "step": 105730 }, { "epoch": 1.14, "learning_rate": 0.0001285334371148732, "loss": 0.0101, "step": 105740 }, { "epoch": 1.14, "learning_rate": 0.00012851722124927026, "loss": 0.0108, "step": 105750 }, { "epoch": 1.14, "learning_rate": 0.00012850100538366738, "loss": 0.0106, "step": 105760 }, { "epoch": 1.14, "learning_rate": 0.00012848478951806445, "loss": 0.0092, "step": 105770 }, { "epoch": 1.14, "learning_rate": 0.00012846857365246157, "loss": 0.0129, "step": 105780 }, { "epoch": 1.14, "learning_rate": 0.00012845235778685866, "loss": 0.0096, "step": 105790 }, { "epoch": 1.14, "learning_rate": 0.00012843614192125575, "loss": 0.0111, "step": 105800 }, { "epoch": 1.14, "learning_rate": 0.00012841992605565285, "loss": 0.0114, "step": 105810 }, { "epoch": 1.14, "learning_rate": 0.00012840371019004994, "loss": 0.0106, "step": 105820 }, { "epoch": 1.14, "learning_rate": 0.00012838749432444703, "loss": 0.0098, "step": 105830 }, { "epoch": 1.14, "learning_rate": 0.00012837127845884413, "loss": 0.009, "step": 105840 }, { "epoch": 1.14, "learning_rate": 0.00012835506259324122, "loss": 0.0087, "step": 105850 }, { "epoch": 1.14, "learning_rate": 0.0001283388467276383, "loss": 0.0127, "step": 105860 }, { "epoch": 1.14, "learning_rate": 0.0001283226308620354, "loss": 0.0123, "step": 105870 }, { "epoch": 1.14, "learning_rate": 0.0001283064149964325, "loss": 0.0095, "step": 105880 }, { "epoch": 1.14, "learning_rate": 0.0001282901991308296, "loss": 0.0085, "step": 105890 }, { "epoch": 1.14, "learning_rate": 0.00012827398326522668, "loss": 0.0119, "step": 105900 }, { "epoch": 1.14, "learning_rate": 0.00012825776739962377, "loss": 0.0106, "step": 105910 }, { "epoch": 1.15, "learning_rate": 0.00012824155153402087, "loss": 0.0096, "step": 105920 }, { "epoch": 1.15, "learning_rate": 0.00012822533566841796, "loss": 0.0097, "step": 105930 }, { "epoch": 1.15, "learning_rate": 0.00012820911980281508, "loss": 0.0096, "step": 105940 }, { "epoch": 1.15, "learning_rate": 0.00012819290393721215, "loss": 0.0097, "step": 105950 }, { "epoch": 1.15, "learning_rate": 0.00012817668807160927, "loss": 0.0095, "step": 105960 }, { "epoch": 1.15, "learning_rate": 0.00012816047220600633, "loss": 0.0091, "step": 105970 }, { "epoch": 1.15, "learning_rate": 0.00012814425634040345, "loss": 0.0081, "step": 105980 }, { "epoch": 1.15, "learning_rate": 0.00012812804047480054, "loss": 0.0103, "step": 105990 }, { "epoch": 1.15, "learning_rate": 0.00012811182460919764, "loss": 0.0119, "step": 106000 }, { "epoch": 1.15, "eval_cer": 0.9215512553918529, "eval_loss": 0.00793379731476307, "eval_runtime": 121.3321, "eval_samples_per_second": 16.484, "eval_steps_per_second": 4.121, "step": 106000 }, { "epoch": 1.15, "learning_rate": 0.00012809560874359473, "loss": 0.0093, "step": 106010 }, { "epoch": 1.15, "learning_rate": 0.00012807939287799182, "loss": 0.0118, "step": 106020 }, { "epoch": 1.15, "learning_rate": 0.00012806317701238892, "loss": 0.0111, "step": 106030 }, { "epoch": 1.15, "learning_rate": 0.000128046961146786, "loss": 0.0097, "step": 106040 }, { "epoch": 1.15, "learning_rate": 0.0001280307452811831, "loss": 0.0129, "step": 106050 }, { "epoch": 1.15, "learning_rate": 0.0001280145294155802, "loss": 0.0096, "step": 106060 }, { "epoch": 1.15, "learning_rate": 0.00012799831354997729, "loss": 0.012, "step": 106070 }, { "epoch": 1.15, "learning_rate": 0.00012798209768437438, "loss": 0.0091, "step": 106080 }, { "epoch": 1.15, "learning_rate": 0.00012796588181877147, "loss": 0.0086, "step": 106090 }, { "epoch": 1.15, "learning_rate": 0.00012794966595316856, "loss": 0.0103, "step": 106100 }, { "epoch": 1.15, "learning_rate": 0.00012793345008756566, "loss": 0.0094, "step": 106110 }, { "epoch": 1.15, "learning_rate": 0.00012791723422196275, "loss": 0.0079, "step": 106120 }, { "epoch": 1.15, "learning_rate": 0.00012790101835635984, "loss": 0.0114, "step": 106130 }, { "epoch": 1.15, "learning_rate": 0.00012788480249075696, "loss": 0.0117, "step": 106140 }, { "epoch": 1.15, "learning_rate": 0.00012786858662515403, "loss": 0.0104, "step": 106150 }, { "epoch": 1.15, "learning_rate": 0.00012785237075955115, "loss": 0.0115, "step": 106160 }, { "epoch": 1.15, "learning_rate": 0.0001278361548939482, "loss": 0.0102, "step": 106170 }, { "epoch": 1.15, "learning_rate": 0.00012781993902834533, "loss": 0.0121, "step": 106180 }, { "epoch": 1.15, "learning_rate": 0.0001278037231627424, "loss": 0.0132, "step": 106190 }, { "epoch": 1.15, "learning_rate": 0.00012778750729713952, "loss": 0.0102, "step": 106200 }, { "epoch": 1.15, "learning_rate": 0.0001277712914315366, "loss": 0.013, "step": 106210 }, { "epoch": 1.15, "learning_rate": 0.0001277550755659337, "loss": 0.01, "step": 106220 }, { "epoch": 1.15, "learning_rate": 0.0001277388597003308, "loss": 0.016, "step": 106230 }, { "epoch": 1.15, "learning_rate": 0.0001277226438347279, "loss": 0.0086, "step": 106240 }, { "epoch": 1.15, "learning_rate": 0.00012770642796912498, "loss": 0.009, "step": 106250 }, { "epoch": 1.15, "learning_rate": 0.00012769021210352208, "loss": 0.0102, "step": 106260 }, { "epoch": 1.15, "learning_rate": 0.00012767399623791917, "loss": 0.0098, "step": 106270 }, { "epoch": 1.15, "learning_rate": 0.00012765778037231626, "loss": 0.011, "step": 106280 }, { "epoch": 1.15, "learning_rate": 0.00012764156450671335, "loss": 0.0111, "step": 106290 }, { "epoch": 1.15, "learning_rate": 0.00012762534864111045, "loss": 0.0089, "step": 106300 }, { "epoch": 1.15, "learning_rate": 0.00012760913277550754, "loss": 0.0104, "step": 106310 }, { "epoch": 1.15, "learning_rate": 0.00012759291690990463, "loss": 0.0122, "step": 106320 }, { "epoch": 1.15, "learning_rate": 0.00012757670104430172, "loss": 0.0109, "step": 106330 }, { "epoch": 1.15, "learning_rate": 0.00012756048517869882, "loss": 0.011, "step": 106340 }, { "epoch": 1.15, "learning_rate": 0.0001275442693130959, "loss": 0.0104, "step": 106350 }, { "epoch": 1.15, "learning_rate": 0.00012752805344749303, "loss": 0.0094, "step": 106360 }, { "epoch": 1.15, "learning_rate": 0.0001275118375818901, "loss": 0.0102, "step": 106370 }, { "epoch": 1.15, "learning_rate": 0.00012749562171628722, "loss": 0.0097, "step": 106380 }, { "epoch": 1.15, "learning_rate": 0.00012747940585068428, "loss": 0.0084, "step": 106390 }, { "epoch": 1.15, "learning_rate": 0.0001274631899850814, "loss": 0.0085, "step": 106400 }, { "epoch": 1.15, "learning_rate": 0.00012744697411947847, "loss": 0.0077, "step": 106410 }, { "epoch": 1.15, "learning_rate": 0.00012743075825387559, "loss": 0.0099, "step": 106420 }, { "epoch": 1.15, "learning_rate": 0.00012741454238827268, "loss": 0.0102, "step": 106430 }, { "epoch": 1.15, "learning_rate": 0.00012739832652266977, "loss": 0.0099, "step": 106440 }, { "epoch": 1.15, "learning_rate": 0.00012738211065706686, "loss": 0.0104, "step": 106450 }, { "epoch": 1.15, "learning_rate": 0.00012736589479146396, "loss": 0.012, "step": 106460 }, { "epoch": 1.15, "learning_rate": 0.00012734967892586105, "loss": 0.0118, "step": 106470 }, { "epoch": 1.15, "learning_rate": 0.00012733346306025814, "loss": 0.0109, "step": 106480 }, { "epoch": 1.15, "learning_rate": 0.00012731724719465524, "loss": 0.0117, "step": 106490 }, { "epoch": 1.15, "learning_rate": 0.00012730103132905233, "loss": 0.0108, "step": 106500 }, { "epoch": 1.15, "learning_rate": 0.00012728481546344945, "loss": 0.0118, "step": 106510 }, { "epoch": 1.15, "learning_rate": 0.00012726859959784651, "loss": 0.0099, "step": 106520 }, { "epoch": 1.15, "learning_rate": 0.00012725238373224363, "loss": 0.0099, "step": 106530 }, { "epoch": 1.15, "learning_rate": 0.0001272361678666407, "loss": 0.0082, "step": 106540 }, { "epoch": 1.15, "learning_rate": 0.00012721995200103782, "loss": 0.0119, "step": 106550 }, { "epoch": 1.15, "learning_rate": 0.00012720373613543488, "loss": 0.0129, "step": 106560 }, { "epoch": 1.15, "learning_rate": 0.000127187520269832, "loss": 0.0103, "step": 106570 }, { "epoch": 1.15, "learning_rate": 0.0001271713044042291, "loss": 0.0095, "step": 106580 }, { "epoch": 1.15, "learning_rate": 0.0001271550885386262, "loss": 0.009, "step": 106590 }, { "epoch": 1.15, "learning_rate": 0.00012713887267302328, "loss": 0.0092, "step": 106600 }, { "epoch": 1.15, "learning_rate": 0.00012712265680742038, "loss": 0.0129, "step": 106610 }, { "epoch": 1.15, "learning_rate": 0.00012710644094181747, "loss": 0.0112, "step": 106620 }, { "epoch": 1.15, "learning_rate": 0.00012709022507621456, "loss": 0.0092, "step": 106630 }, { "epoch": 1.15, "learning_rate": 0.00012707400921061165, "loss": 0.0087, "step": 106640 }, { "epoch": 1.15, "learning_rate": 0.00012705779334500875, "loss": 0.0096, "step": 106650 }, { "epoch": 1.15, "learning_rate": 0.00012704157747940584, "loss": 0.0128, "step": 106660 }, { "epoch": 1.15, "learning_rate": 0.00012702536161380293, "loss": 0.0097, "step": 106670 }, { "epoch": 1.15, "learning_rate": 0.00012700914574820002, "loss": 0.0084, "step": 106680 }, { "epoch": 1.15, "learning_rate": 0.00012699292988259712, "loss": 0.0119, "step": 106690 }, { "epoch": 1.15, "learning_rate": 0.0001269767140169942, "loss": 0.0113, "step": 106700 }, { "epoch": 1.15, "learning_rate": 0.0001269604981513913, "loss": 0.0111, "step": 106710 }, { "epoch": 1.15, "learning_rate": 0.0001269442822857884, "loss": 0.0093, "step": 106720 }, { "epoch": 1.15, "learning_rate": 0.00012692806642018552, "loss": 0.0143, "step": 106730 }, { "epoch": 1.15, "learning_rate": 0.00012691185055458258, "loss": 0.0095, "step": 106740 }, { "epoch": 1.15, "learning_rate": 0.0001268956346889797, "loss": 0.0095, "step": 106750 }, { "epoch": 1.15, "learning_rate": 0.00012687941882337677, "loss": 0.0101, "step": 106760 }, { "epoch": 1.15, "learning_rate": 0.0001268632029577739, "loss": 0.0124, "step": 106770 }, { "epoch": 1.15, "learning_rate": 0.00012684698709217095, "loss": 0.0103, "step": 106780 }, { "epoch": 1.15, "learning_rate": 0.00012683077122656807, "loss": 0.0097, "step": 106790 }, { "epoch": 1.15, "learning_rate": 0.00012681455536096516, "loss": 0.009, "step": 106800 }, { "epoch": 1.15, "learning_rate": 0.00012679833949536226, "loss": 0.0091, "step": 106810 }, { "epoch": 1.15, "learning_rate": 0.00012678212362975935, "loss": 0.0094, "step": 106820 }, { "epoch": 1.15, "learning_rate": 0.00012676590776415644, "loss": 0.0112, "step": 106830 }, { "epoch": 1.15, "learning_rate": 0.00012674969189855354, "loss": 0.0099, "step": 106840 }, { "epoch": 1.16, "learning_rate": 0.00012673347603295063, "loss": 0.0084, "step": 106850 }, { "epoch": 1.16, "learning_rate": 0.00012671726016734772, "loss": 0.0102, "step": 106860 }, { "epoch": 1.16, "learning_rate": 0.00012670104430174481, "loss": 0.01, "step": 106870 }, { "epoch": 1.16, "learning_rate": 0.0001266848284361419, "loss": 0.0095, "step": 106880 }, { "epoch": 1.16, "learning_rate": 0.000126668612570539, "loss": 0.0098, "step": 106890 }, { "epoch": 1.16, "learning_rate": 0.0001266523967049361, "loss": 0.0132, "step": 106900 }, { "epoch": 1.16, "learning_rate": 0.00012663618083933318, "loss": 0.0093, "step": 106910 }, { "epoch": 1.16, "learning_rate": 0.00012661996497373028, "loss": 0.0088, "step": 106920 }, { "epoch": 1.16, "learning_rate": 0.00012660374910812737, "loss": 0.0093, "step": 106930 }, { "epoch": 1.16, "learning_rate": 0.00012658753324252446, "loss": 0.0128, "step": 106940 }, { "epoch": 1.16, "learning_rate": 0.00012657131737692158, "loss": 0.0097, "step": 106950 }, { "epoch": 1.16, "learning_rate": 0.00012655510151131865, "loss": 0.0126, "step": 106960 }, { "epoch": 1.16, "learning_rate": 0.00012653888564571577, "loss": 0.0101, "step": 106970 }, { "epoch": 1.16, "learning_rate": 0.00012652266978011283, "loss": 0.0102, "step": 106980 }, { "epoch": 1.16, "learning_rate": 0.00012650645391450995, "loss": 0.0092, "step": 106990 }, { "epoch": 1.16, "learning_rate": 0.00012649023804890705, "loss": 0.0079, "step": 107000 }, { "epoch": 1.16, "eval_cer": 0.9215686274509803, "eval_loss": 0.008123186416924, "eval_runtime": 121.1965, "eval_samples_per_second": 16.502, "eval_steps_per_second": 4.126, "step": 107000 }, { "epoch": 1.16, "learning_rate": 0.00012647402218330414, "loss": 0.0084, "step": 107010 }, { "epoch": 1.16, "learning_rate": 0.00012645780631770123, "loss": 0.0105, "step": 107020 }, { "epoch": 1.16, "learning_rate": 0.00012644159045209832, "loss": 0.0107, "step": 107030 }, { "epoch": 1.16, "learning_rate": 0.00012642537458649542, "loss": 0.0097, "step": 107040 }, { "epoch": 1.16, "learning_rate": 0.0001264091587208925, "loss": 0.01, "step": 107050 }, { "epoch": 1.16, "learning_rate": 0.0001263929428552896, "loss": 0.0088, "step": 107060 }, { "epoch": 1.16, "learning_rate": 0.0001263767269896867, "loss": 0.0112, "step": 107070 }, { "epoch": 1.16, "learning_rate": 0.0001263605111240838, "loss": 0.0116, "step": 107080 }, { "epoch": 1.16, "learning_rate": 0.00012634429525848088, "loss": 0.0108, "step": 107090 }, { "epoch": 1.16, "learning_rate": 0.00012632807939287797, "loss": 0.0098, "step": 107100 }, { "epoch": 1.16, "learning_rate": 0.00012631186352727507, "loss": 0.0119, "step": 107110 }, { "epoch": 1.16, "learning_rate": 0.00012629564766167216, "loss": 0.0125, "step": 107120 }, { "epoch": 1.16, "learning_rate": 0.00012627943179606925, "loss": 0.0091, "step": 107130 }, { "epoch": 1.16, "learning_rate": 0.00012626321593046635, "loss": 0.0095, "step": 107140 }, { "epoch": 1.16, "learning_rate": 0.00012624700006486346, "loss": 0.0117, "step": 107150 }, { "epoch": 1.16, "learning_rate": 0.00012623078419926053, "loss": 0.0097, "step": 107160 }, { "epoch": 1.16, "learning_rate": 0.00012621456833365765, "loss": 0.0088, "step": 107170 }, { "epoch": 1.16, "learning_rate": 0.00012619835246805474, "loss": 0.0094, "step": 107180 }, { "epoch": 1.16, "learning_rate": 0.00012618213660245184, "loss": 0.0093, "step": 107190 }, { "epoch": 1.16, "learning_rate": 0.00012616592073684893, "loss": 0.0114, "step": 107200 }, { "epoch": 1.16, "learning_rate": 0.00012614970487124602, "loss": 0.0128, "step": 107210 }, { "epoch": 1.16, "learning_rate": 0.00012613348900564311, "loss": 0.0105, "step": 107220 }, { "epoch": 1.16, "learning_rate": 0.0001261172731400402, "loss": 0.0096, "step": 107230 }, { "epoch": 1.16, "learning_rate": 0.0001261010572744373, "loss": 0.012, "step": 107240 }, { "epoch": 1.16, "learning_rate": 0.0001260848414088344, "loss": 0.0112, "step": 107250 }, { "epoch": 1.16, "learning_rate": 0.00012606862554323149, "loss": 0.0076, "step": 107260 }, { "epoch": 1.16, "learning_rate": 0.00012605240967762858, "loss": 0.0108, "step": 107270 }, { "epoch": 1.16, "learning_rate": 0.00012603619381202567, "loss": 0.01, "step": 107280 }, { "epoch": 1.16, "learning_rate": 0.00012601997794642276, "loss": 0.0076, "step": 107290 }, { "epoch": 1.16, "learning_rate": 0.00012600376208081988, "loss": 0.0092, "step": 107300 }, { "epoch": 1.16, "learning_rate": 0.00012598754621521695, "loss": 0.0086, "step": 107310 }, { "epoch": 1.16, "learning_rate": 0.00012597133034961407, "loss": 0.009, "step": 107320 }, { "epoch": 1.16, "learning_rate": 0.00012595511448401113, "loss": 0.0107, "step": 107330 }, { "epoch": 1.16, "learning_rate": 0.00012593889861840825, "loss": 0.0096, "step": 107340 }, { "epoch": 1.16, "learning_rate": 0.00012592268275280532, "loss": 0.0105, "step": 107350 }, { "epoch": 1.16, "learning_rate": 0.00012590646688720244, "loss": 0.0087, "step": 107360 }, { "epoch": 1.16, "learning_rate": 0.00012589025102159953, "loss": 0.0118, "step": 107370 }, { "epoch": 1.16, "learning_rate": 0.00012587403515599663, "loss": 0.0103, "step": 107380 }, { "epoch": 1.16, "learning_rate": 0.00012585781929039372, "loss": 0.0088, "step": 107390 }, { "epoch": 1.16, "learning_rate": 0.0001258416034247908, "loss": 0.0113, "step": 107400 }, { "epoch": 1.16, "learning_rate": 0.0001258253875591879, "loss": 0.0091, "step": 107410 }, { "epoch": 1.16, "learning_rate": 0.000125809171693585, "loss": 0.0106, "step": 107420 }, { "epoch": 1.16, "learning_rate": 0.0001257929558279821, "loss": 0.0086, "step": 107430 }, { "epoch": 1.16, "learning_rate": 0.00012577673996237918, "loss": 0.0111, "step": 107440 }, { "epoch": 1.16, "learning_rate": 0.00012576052409677627, "loss": 0.0087, "step": 107450 }, { "epoch": 1.16, "learning_rate": 0.00012574430823117337, "loss": 0.0124, "step": 107460 }, { "epoch": 1.16, "learning_rate": 0.00012572809236557046, "loss": 0.0095, "step": 107470 }, { "epoch": 1.16, "learning_rate": 0.00012571187649996755, "loss": 0.008, "step": 107480 }, { "epoch": 1.16, "learning_rate": 0.00012569566063436465, "loss": 0.0073, "step": 107490 }, { "epoch": 1.16, "learning_rate": 0.00012567944476876174, "loss": 0.0109, "step": 107500 }, { "epoch": 1.16, "learning_rate": 0.00012566322890315883, "loss": 0.0106, "step": 107510 }, { "epoch": 1.16, "learning_rate": 0.00012564701303755595, "loss": 0.01, "step": 107520 }, { "epoch": 1.16, "learning_rate": 0.00012563079717195302, "loss": 0.0108, "step": 107530 }, { "epoch": 1.16, "learning_rate": 0.00012561458130635014, "loss": 0.0114, "step": 107540 }, { "epoch": 1.16, "learning_rate": 0.0001255983654407472, "loss": 0.0121, "step": 107550 }, { "epoch": 1.16, "learning_rate": 0.00012558214957514432, "loss": 0.0114, "step": 107560 }, { "epoch": 1.16, "learning_rate": 0.0001255659337095414, "loss": 0.0111, "step": 107570 }, { "epoch": 1.16, "learning_rate": 0.0001255497178439385, "loss": 0.0115, "step": 107580 }, { "epoch": 1.16, "learning_rate": 0.0001255335019783356, "loss": 0.0133, "step": 107590 }, { "epoch": 1.16, "learning_rate": 0.0001255172861127327, "loss": 0.0106, "step": 107600 }, { "epoch": 1.16, "learning_rate": 0.00012550107024712979, "loss": 0.0089, "step": 107610 }, { "epoch": 1.16, "learning_rate": 0.00012548485438152688, "loss": 0.0091, "step": 107620 }, { "epoch": 1.16, "learning_rate": 0.00012546863851592397, "loss": 0.012, "step": 107630 }, { "epoch": 1.16, "learning_rate": 0.00012545242265032106, "loss": 0.0101, "step": 107640 }, { "epoch": 1.16, "learning_rate": 0.00012543620678471816, "loss": 0.011, "step": 107650 }, { "epoch": 1.16, "learning_rate": 0.00012541999091911525, "loss": 0.0093, "step": 107660 }, { "epoch": 1.16, "learning_rate": 0.00012540377505351234, "loss": 0.0104, "step": 107670 }, { "epoch": 1.16, "learning_rate": 0.00012538755918790943, "loss": 0.0085, "step": 107680 }, { "epoch": 1.16, "learning_rate": 0.00012537134332230653, "loss": 0.0133, "step": 107690 }, { "epoch": 1.16, "learning_rate": 0.00012535512745670362, "loss": 0.0109, "step": 107700 }, { "epoch": 1.16, "learning_rate": 0.0001253389115911007, "loss": 0.0095, "step": 107710 }, { "epoch": 1.16, "learning_rate": 0.0001253226957254978, "loss": 0.0124, "step": 107720 }, { "epoch": 1.16, "learning_rate": 0.0001253064798598949, "loss": 0.0127, "step": 107730 }, { "epoch": 1.16, "learning_rate": 0.00012529026399429202, "loss": 0.0125, "step": 107740 }, { "epoch": 1.16, "learning_rate": 0.00012527404812868908, "loss": 0.01, "step": 107750 }, { "epoch": 1.16, "learning_rate": 0.0001252578322630862, "loss": 0.0104, "step": 107760 }, { "epoch": 1.17, "learning_rate": 0.00012524161639748327, "loss": 0.0106, "step": 107770 }, { "epoch": 1.17, "learning_rate": 0.0001252254005318804, "loss": 0.0104, "step": 107780 }, { "epoch": 1.17, "learning_rate": 0.00012520918466627745, "loss": 0.0102, "step": 107790 }, { "epoch": 1.17, "learning_rate": 0.00012519296880067457, "loss": 0.0082, "step": 107800 }, { "epoch": 1.17, "learning_rate": 0.00012517675293507167, "loss": 0.0088, "step": 107810 }, { "epoch": 1.17, "learning_rate": 0.00012516053706946876, "loss": 0.0109, "step": 107820 }, { "epoch": 1.17, "learning_rate": 0.00012514432120386585, "loss": 0.0102, "step": 107830 }, { "epoch": 1.17, "learning_rate": 0.00012512810533826295, "loss": 0.013, "step": 107840 }, { "epoch": 1.17, "learning_rate": 0.00012511188947266004, "loss": 0.0113, "step": 107850 }, { "epoch": 1.17, "learning_rate": 0.00012509567360705713, "loss": 0.0126, "step": 107860 }, { "epoch": 1.17, "learning_rate": 0.00012507945774145422, "loss": 0.0093, "step": 107870 }, { "epoch": 1.17, "learning_rate": 0.00012506324187585132, "loss": 0.0131, "step": 107880 }, { "epoch": 1.17, "learning_rate": 0.0001250470260102484, "loss": 0.0106, "step": 107890 }, { "epoch": 1.17, "learning_rate": 0.0001250308101446455, "loss": 0.009, "step": 107900 }, { "epoch": 1.17, "learning_rate": 0.00012501459427904262, "loss": 0.0117, "step": 107910 }, { "epoch": 1.17, "learning_rate": 0.0001249983784134397, "loss": 0.0106, "step": 107920 }, { "epoch": 1.17, "learning_rate": 0.0001249821625478368, "loss": 0.0101, "step": 107930 }, { "epoch": 1.17, "learning_rate": 0.00012496594668223387, "loss": 0.0085, "step": 107940 }, { "epoch": 1.17, "learning_rate": 0.000124949730816631, "loss": 0.0152, "step": 107950 }, { "epoch": 1.17, "learning_rate": 0.00012493351495102809, "loss": 0.0113, "step": 107960 }, { "epoch": 1.17, "learning_rate": 0.00012491729908542518, "loss": 0.01, "step": 107970 }, { "epoch": 1.17, "learning_rate": 0.00012490108321982227, "loss": 0.0103, "step": 107980 }, { "epoch": 1.17, "learning_rate": 0.00012488486735421936, "loss": 0.0102, "step": 107990 }, { "epoch": 1.17, "learning_rate": 0.00012486865148861646, "loss": 0.0108, "step": 108000 }, { "epoch": 1.17, "eval_cer": 0.9215590728184603, "eval_loss": 0.008009477518498898, "eval_runtime": 121.2932, "eval_samples_per_second": 16.489, "eval_steps_per_second": 4.122, "step": 108000 }, { "epoch": 1.17, "learning_rate": 0.00012485243562301355, "loss": 0.0115, "step": 108010 }, { "epoch": 1.17, "learning_rate": 0.00012483621975741064, "loss": 0.0106, "step": 108020 }, { "epoch": 1.17, "learning_rate": 0.00012482000389180773, "loss": 0.0094, "step": 108030 }, { "epoch": 1.17, "learning_rate": 0.00012480378802620483, "loss": 0.0103, "step": 108040 }, { "epoch": 1.17, "learning_rate": 0.00012478757216060192, "loss": 0.0087, "step": 108050 }, { "epoch": 1.17, "learning_rate": 0.000124771356294999, "loss": 0.0106, "step": 108060 }, { "epoch": 1.17, "learning_rate": 0.0001247551404293961, "loss": 0.0104, "step": 108070 }, { "epoch": 1.17, "learning_rate": 0.0001247389245637932, "loss": 0.0096, "step": 108080 }, { "epoch": 1.17, "learning_rate": 0.0001247227086981903, "loss": 0.0117, "step": 108090 }, { "epoch": 1.17, "learning_rate": 0.00012470649283258738, "loss": 0.0104, "step": 108100 }, { "epoch": 1.17, "learning_rate": 0.0001246902769669845, "loss": 0.0099, "step": 108110 }, { "epoch": 1.17, "learning_rate": 0.00012467406110138157, "loss": 0.0132, "step": 108120 }, { "epoch": 1.17, "learning_rate": 0.0001246578452357787, "loss": 0.0084, "step": 108130 }, { "epoch": 1.17, "learning_rate": 0.00012464162937017575, "loss": 0.0139, "step": 108140 }, { "epoch": 1.17, "learning_rate": 0.00012462541350457287, "loss": 0.0077, "step": 108150 }, { "epoch": 1.17, "learning_rate": 0.00012460919763896997, "loss": 0.0116, "step": 108160 }, { "epoch": 1.17, "learning_rate": 0.00012459298177336706, "loss": 0.0077, "step": 108170 }, { "epoch": 1.17, "learning_rate": 0.00012457676590776415, "loss": 0.0134, "step": 108180 }, { "epoch": 1.17, "learning_rate": 0.00012456055004216125, "loss": 0.0098, "step": 108190 }, { "epoch": 1.17, "learning_rate": 0.00012454433417655834, "loss": 0.0084, "step": 108200 }, { "epoch": 1.17, "learning_rate": 0.00012452811831095543, "loss": 0.0111, "step": 108210 }, { "epoch": 1.17, "learning_rate": 0.00012451190244535252, "loss": 0.0114, "step": 108220 }, { "epoch": 1.17, "learning_rate": 0.00012449568657974962, "loss": 0.0133, "step": 108230 }, { "epoch": 1.17, "learning_rate": 0.0001244794707141467, "loss": 0.0082, "step": 108240 }, { "epoch": 1.17, "learning_rate": 0.0001244632548485438, "loss": 0.0115, "step": 108250 }, { "epoch": 1.17, "learning_rate": 0.0001244470389829409, "loss": 0.0093, "step": 108260 }, { "epoch": 1.17, "learning_rate": 0.000124430823117338, "loss": 0.0098, "step": 108270 }, { "epoch": 1.17, "learning_rate": 0.00012441460725173508, "loss": 0.0088, "step": 108280 }, { "epoch": 1.17, "learning_rate": 0.00012439839138613217, "loss": 0.0083, "step": 108290 }, { "epoch": 1.17, "learning_rate": 0.00012438217552052927, "loss": 0.0087, "step": 108300 }, { "epoch": 1.17, "learning_rate": 0.00012436595965492639, "loss": 0.011, "step": 108310 }, { "epoch": 1.17, "learning_rate": 0.00012434974378932345, "loss": 0.0123, "step": 108320 }, { "epoch": 1.17, "learning_rate": 0.00012433352792372057, "loss": 0.0096, "step": 108330 }, { "epoch": 1.17, "learning_rate": 0.00012431731205811764, "loss": 0.0066, "step": 108340 }, { "epoch": 1.17, "learning_rate": 0.00012430109619251476, "loss": 0.0094, "step": 108350 }, { "epoch": 1.17, "learning_rate": 0.00012428488032691182, "loss": 0.0109, "step": 108360 }, { "epoch": 1.17, "learning_rate": 0.00012426866446130894, "loss": 0.0072, "step": 108370 }, { "epoch": 1.17, "learning_rate": 0.00012425244859570603, "loss": 0.0106, "step": 108380 }, { "epoch": 1.17, "learning_rate": 0.00012423623273010313, "loss": 0.0095, "step": 108390 }, { "epoch": 1.17, "learning_rate": 0.00012422001686450022, "loss": 0.0114, "step": 108400 }, { "epoch": 1.17, "learning_rate": 0.0001242038009988973, "loss": 0.0112, "step": 108410 }, { "epoch": 1.17, "learning_rate": 0.0001241875851332944, "loss": 0.0094, "step": 108420 }, { "epoch": 1.17, "learning_rate": 0.0001241713692676915, "loss": 0.0105, "step": 108430 }, { "epoch": 1.17, "learning_rate": 0.0001241551534020886, "loss": 0.0116, "step": 108440 }, { "epoch": 1.17, "learning_rate": 0.00012413893753648568, "loss": 0.0086, "step": 108450 }, { "epoch": 1.17, "learning_rate": 0.00012412272167088278, "loss": 0.0083, "step": 108460 }, { "epoch": 1.17, "learning_rate": 0.00012410650580527987, "loss": 0.0086, "step": 108470 }, { "epoch": 1.17, "learning_rate": 0.00012409028993967696, "loss": 0.0108, "step": 108480 }, { "epoch": 1.17, "learning_rate": 0.00012407407407407406, "loss": 0.0129, "step": 108490 }, { "epoch": 1.17, "learning_rate": 0.00012405785820847115, "loss": 0.01, "step": 108500 }, { "epoch": 1.17, "learning_rate": 0.00012404164234286824, "loss": 0.0087, "step": 108510 }, { "epoch": 1.17, "learning_rate": 0.00012402542647726533, "loss": 0.0096, "step": 108520 }, { "epoch": 1.17, "learning_rate": 0.00012400921061166245, "loss": 0.0112, "step": 108530 }, { "epoch": 1.17, "learning_rate": 0.00012399299474605952, "loss": 0.0087, "step": 108540 }, { "epoch": 1.17, "learning_rate": 0.00012397677888045664, "loss": 0.0122, "step": 108550 }, { "epoch": 1.17, "learning_rate": 0.0001239605630148537, "loss": 0.0107, "step": 108560 }, { "epoch": 1.17, "learning_rate": 0.00012394434714925082, "loss": 0.0114, "step": 108570 }, { "epoch": 1.17, "learning_rate": 0.0001239281312836479, "loss": 0.009, "step": 108580 }, { "epoch": 1.17, "learning_rate": 0.000123911915418045, "loss": 0.0093, "step": 108590 }, { "epoch": 1.17, "learning_rate": 0.0001238956995524421, "loss": 0.015, "step": 108600 }, { "epoch": 1.17, "learning_rate": 0.0001238794836868392, "loss": 0.008, "step": 108610 }, { "epoch": 1.17, "learning_rate": 0.0001238632678212363, "loss": 0.0098, "step": 108620 }, { "epoch": 1.17, "learning_rate": 0.00012384705195563338, "loss": 0.0101, "step": 108630 }, { "epoch": 1.17, "learning_rate": 0.00012383083609003047, "loss": 0.0102, "step": 108640 }, { "epoch": 1.17, "learning_rate": 0.00012381462022442757, "loss": 0.0085, "step": 108650 }, { "epoch": 1.17, "learning_rate": 0.00012379840435882466, "loss": 0.0095, "step": 108660 }, { "epoch": 1.17, "learning_rate": 0.00012378218849322175, "loss": 0.011, "step": 108670 }, { "epoch": 1.17, "learning_rate": 0.00012376597262761887, "loss": 0.0104, "step": 108680 }, { "epoch": 1.17, "learning_rate": 0.00012374975676201594, "loss": 0.0091, "step": 108690 }, { "epoch": 1.18, "learning_rate": 0.00012373354089641306, "loss": 0.0077, "step": 108700 }, { "epoch": 1.18, "learning_rate": 0.00012371732503081012, "loss": 0.0096, "step": 108710 }, { "epoch": 1.18, "learning_rate": 0.00012370110916520724, "loss": 0.0103, "step": 108720 }, { "epoch": 1.18, "learning_rate": 0.0001236848932996043, "loss": 0.0082, "step": 108730 }, { "epoch": 1.18, "learning_rate": 0.00012366867743400143, "loss": 0.0092, "step": 108740 }, { "epoch": 1.18, "learning_rate": 0.00012365246156839852, "loss": 0.0104, "step": 108750 }, { "epoch": 1.18, "learning_rate": 0.0001236362457027956, "loss": 0.0099, "step": 108760 }, { "epoch": 1.18, "learning_rate": 0.0001236200298371927, "loss": 0.009, "step": 108770 }, { "epoch": 1.18, "learning_rate": 0.0001236038139715898, "loss": 0.0105, "step": 108780 }, { "epoch": 1.18, "learning_rate": 0.0001235875981059869, "loss": 0.0107, "step": 108790 }, { "epoch": 1.18, "learning_rate": 0.00012357138224038398, "loss": 0.0108, "step": 108800 }, { "epoch": 1.18, "learning_rate": 0.00012355516637478108, "loss": 0.0097, "step": 108810 }, { "epoch": 1.18, "learning_rate": 0.00012353895050917817, "loss": 0.0106, "step": 108820 }, { "epoch": 1.18, "learning_rate": 0.00012352273464357526, "loss": 0.0095, "step": 108830 }, { "epoch": 1.18, "learning_rate": 0.00012350651877797236, "loss": 0.0117, "step": 108840 }, { "epoch": 1.18, "learning_rate": 0.00012349030291236945, "loss": 0.0088, "step": 108850 }, { "epoch": 1.18, "learning_rate": 0.00012347408704676654, "loss": 0.0101, "step": 108860 }, { "epoch": 1.18, "learning_rate": 0.00012345787118116363, "loss": 0.0093, "step": 108870 }, { "epoch": 1.18, "learning_rate": 0.00012344165531556073, "loss": 0.0113, "step": 108880 }, { "epoch": 1.18, "learning_rate": 0.00012342543944995782, "loss": 0.0112, "step": 108890 }, { "epoch": 1.18, "learning_rate": 0.00012340922358435494, "loss": 0.0094, "step": 108900 }, { "epoch": 1.18, "learning_rate": 0.000123393007718752, "loss": 0.0107, "step": 108910 }, { "epoch": 1.18, "learning_rate": 0.00012337679185314912, "loss": 0.0076, "step": 108920 }, { "epoch": 1.18, "learning_rate": 0.0001233605759875462, "loss": 0.0093, "step": 108930 }, { "epoch": 1.18, "learning_rate": 0.0001233443601219433, "loss": 0.0098, "step": 108940 }, { "epoch": 1.18, "learning_rate": 0.00012332814425634038, "loss": 0.0089, "step": 108950 }, { "epoch": 1.18, "learning_rate": 0.0001233119283907375, "loss": 0.0109, "step": 108960 }, { "epoch": 1.18, "learning_rate": 0.0001232957125251346, "loss": 0.0125, "step": 108970 }, { "epoch": 1.18, "learning_rate": 0.00012327949665953168, "loss": 0.0115, "step": 108980 }, { "epoch": 1.18, "learning_rate": 0.00012326328079392877, "loss": 0.0087, "step": 108990 }, { "epoch": 1.18, "learning_rate": 0.00012324706492832587, "loss": 0.01, "step": 109000 }, { "epoch": 1.18, "eval_cer": 0.9215503867888964, "eval_loss": 0.0077276891097426414, "eval_runtime": 121.2693, "eval_samples_per_second": 16.492, "eval_steps_per_second": 4.123, "step": 109000 }, { "epoch": 1.18, "learning_rate": 0.00012323084906272296, "loss": 0.0112, "step": 109010 }, { "epoch": 1.18, "learning_rate": 0.00012321463319712005, "loss": 0.0103, "step": 109020 }, { "epoch": 1.18, "learning_rate": 0.00012319841733151714, "loss": 0.0109, "step": 109030 }, { "epoch": 1.18, "learning_rate": 0.00012318220146591424, "loss": 0.0112, "step": 109040 }, { "epoch": 1.18, "learning_rate": 0.00012316598560031133, "loss": 0.0085, "step": 109050 }, { "epoch": 1.18, "learning_rate": 0.00012314976973470842, "loss": 0.0077, "step": 109060 }, { "epoch": 1.18, "learning_rate": 0.00012313355386910552, "loss": 0.0089, "step": 109070 }, { "epoch": 1.18, "learning_rate": 0.0001231173380035026, "loss": 0.0102, "step": 109080 }, { "epoch": 1.18, "learning_rate": 0.0001231011221378997, "loss": 0.0101, "step": 109090 }, { "epoch": 1.18, "learning_rate": 0.0001230849062722968, "loss": 0.0109, "step": 109100 }, { "epoch": 1.18, "learning_rate": 0.0001230686904066939, "loss": 0.0082, "step": 109110 }, { "epoch": 1.18, "learning_rate": 0.000123052474541091, "loss": 0.0089, "step": 109120 }, { "epoch": 1.18, "learning_rate": 0.00012303625867548807, "loss": 0.008, "step": 109130 }, { "epoch": 1.18, "learning_rate": 0.0001230200428098852, "loss": 0.0098, "step": 109140 }, { "epoch": 1.18, "learning_rate": 0.00012300382694428226, "loss": 0.0112, "step": 109150 }, { "epoch": 1.18, "learning_rate": 0.00012298761107867938, "loss": 0.0141, "step": 109160 }, { "epoch": 1.18, "learning_rate": 0.00012297139521307647, "loss": 0.0123, "step": 109170 }, { "epoch": 1.18, "learning_rate": 0.00012295517934747356, "loss": 0.0103, "step": 109180 }, { "epoch": 1.18, "learning_rate": 0.00012293896348187066, "loss": 0.0087, "step": 109190 }, { "epoch": 1.18, "learning_rate": 0.00012292274761626775, "loss": 0.0115, "step": 109200 }, { "epoch": 1.18, "learning_rate": 0.00012290653175066484, "loss": 0.0086, "step": 109210 }, { "epoch": 1.18, "learning_rate": 0.00012289031588506193, "loss": 0.0106, "step": 109220 }, { "epoch": 1.18, "learning_rate": 0.00012287410001945903, "loss": 0.0109, "step": 109230 }, { "epoch": 1.18, "learning_rate": 0.00012285788415385612, "loss": 0.0089, "step": 109240 }, { "epoch": 1.18, "learning_rate": 0.0001228416682882532, "loss": 0.0093, "step": 109250 }, { "epoch": 1.18, "learning_rate": 0.0001228254524226503, "loss": 0.0078, "step": 109260 }, { "epoch": 1.18, "learning_rate": 0.0001228092365570474, "loss": 0.0076, "step": 109270 }, { "epoch": 1.18, "learning_rate": 0.0001227930206914445, "loss": 0.0088, "step": 109280 }, { "epoch": 1.18, "learning_rate": 0.00012277680482584158, "loss": 0.0089, "step": 109290 }, { "epoch": 1.18, "learning_rate": 0.00012276058896023868, "loss": 0.0089, "step": 109300 }, { "epoch": 1.18, "learning_rate": 0.00012274437309463577, "loss": 0.0119, "step": 109310 }, { "epoch": 1.18, "learning_rate": 0.0001227281572290329, "loss": 0.0093, "step": 109320 }, { "epoch": 1.18, "learning_rate": 0.00012271194136342995, "loss": 0.0089, "step": 109330 }, { "epoch": 1.18, "learning_rate": 0.00012269572549782707, "loss": 0.0111, "step": 109340 }, { "epoch": 1.18, "learning_rate": 0.00012267950963222417, "loss": 0.009, "step": 109350 }, { "epoch": 1.18, "learning_rate": 0.00012266329376662126, "loss": 0.0093, "step": 109360 }, { "epoch": 1.18, "learning_rate": 0.00012264707790101835, "loss": 0.0103, "step": 109370 }, { "epoch": 1.18, "learning_rate": 0.00012263086203541544, "loss": 0.0117, "step": 109380 }, { "epoch": 1.18, "learning_rate": 0.00012261464616981254, "loss": 0.0101, "step": 109390 }, { "epoch": 1.18, "learning_rate": 0.00012259843030420963, "loss": 0.0092, "step": 109400 }, { "epoch": 1.18, "learning_rate": 0.00012258221443860672, "loss": 0.0107, "step": 109410 }, { "epoch": 1.18, "learning_rate": 0.00012256599857300382, "loss": 0.0105, "step": 109420 }, { "epoch": 1.18, "learning_rate": 0.0001225497827074009, "loss": 0.012, "step": 109430 }, { "epoch": 1.18, "learning_rate": 0.000122533566841798, "loss": 0.012, "step": 109440 }, { "epoch": 1.18, "learning_rate": 0.0001225173509761951, "loss": 0.0113, "step": 109450 }, { "epoch": 1.18, "learning_rate": 0.0001225011351105922, "loss": 0.0104, "step": 109460 }, { "epoch": 1.18, "learning_rate": 0.0001224849192449893, "loss": 0.0115, "step": 109470 }, { "epoch": 1.18, "learning_rate": 0.00012246870337938637, "loss": 0.0119, "step": 109480 }, { "epoch": 1.18, "learning_rate": 0.0001224524875137835, "loss": 0.009, "step": 109490 }, { "epoch": 1.18, "learning_rate": 0.00012243627164818056, "loss": 0.0081, "step": 109500 }, { "epoch": 1.18, "learning_rate": 0.00012242005578257768, "loss": 0.0088, "step": 109510 }, { "epoch": 1.18, "learning_rate": 0.00012240383991697474, "loss": 0.0099, "step": 109520 }, { "epoch": 1.18, "learning_rate": 0.00012238762405137186, "loss": 0.0083, "step": 109530 }, { "epoch": 1.18, "learning_rate": 0.00012237140818576896, "loss": 0.0103, "step": 109540 }, { "epoch": 1.18, "learning_rate": 0.00012235519232016605, "loss": 0.0115, "step": 109550 }, { "epoch": 1.18, "learning_rate": 0.00012233897645456314, "loss": 0.0092, "step": 109560 }, { "epoch": 1.18, "learning_rate": 0.00012232276058896023, "loss": 0.0103, "step": 109570 }, { "epoch": 1.18, "learning_rate": 0.00012230654472335733, "loss": 0.0122, "step": 109580 }, { "epoch": 1.18, "learning_rate": 0.00012229032885775442, "loss": 0.0114, "step": 109590 }, { "epoch": 1.18, "learning_rate": 0.0001222741129921515, "loss": 0.0105, "step": 109600 }, { "epoch": 1.18, "learning_rate": 0.0001222578971265486, "loss": 0.0099, "step": 109610 }, { "epoch": 1.19, "learning_rate": 0.0001222416812609457, "loss": 0.0085, "step": 109620 }, { "epoch": 1.19, "learning_rate": 0.0001222254653953428, "loss": 0.0101, "step": 109630 }, { "epoch": 1.19, "learning_rate": 0.00012220924952973988, "loss": 0.0091, "step": 109640 }, { "epoch": 1.19, "learning_rate": 0.00012219303366413698, "loss": 0.0127, "step": 109650 }, { "epoch": 1.19, "learning_rate": 0.00012217681779853407, "loss": 0.0102, "step": 109660 }, { "epoch": 1.19, "learning_rate": 0.00012216060193293116, "loss": 0.0086, "step": 109670 }, { "epoch": 1.19, "learning_rate": 0.00012214438606732825, "loss": 0.0101, "step": 109680 }, { "epoch": 1.19, "learning_rate": 0.00012212817020172537, "loss": 0.0093, "step": 109690 }, { "epoch": 1.19, "learning_rate": 0.00012211195433612244, "loss": 0.0099, "step": 109700 }, { "epoch": 1.19, "learning_rate": 0.00012209573847051956, "loss": 0.0099, "step": 109710 }, { "epoch": 1.19, "learning_rate": 0.00012207952260491663, "loss": 0.0091, "step": 109720 }, { "epoch": 1.19, "learning_rate": 0.00012206330673931373, "loss": 0.0112, "step": 109730 }, { "epoch": 1.19, "learning_rate": 0.00012204709087371082, "loss": 0.0126, "step": 109740 }, { "epoch": 1.19, "learning_rate": 0.00012203087500810793, "loss": 0.0132, "step": 109750 }, { "epoch": 1.19, "learning_rate": 0.00012201465914250501, "loss": 0.0087, "step": 109760 }, { "epoch": 1.19, "learning_rate": 0.00012199844327690212, "loss": 0.0083, "step": 109770 }, { "epoch": 1.19, "learning_rate": 0.0001219822274112992, "loss": 0.0095, "step": 109780 }, { "epoch": 1.19, "learning_rate": 0.0001219660115456963, "loss": 0.0073, "step": 109790 }, { "epoch": 1.19, "learning_rate": 0.00012194979568009338, "loss": 0.0116, "step": 109800 }, { "epoch": 1.19, "learning_rate": 0.00012193357981449049, "loss": 0.0094, "step": 109810 }, { "epoch": 1.19, "learning_rate": 0.00012191736394888758, "loss": 0.0096, "step": 109820 }, { "epoch": 1.19, "learning_rate": 0.00012190114808328467, "loss": 0.0085, "step": 109830 }, { "epoch": 1.19, "learning_rate": 0.00012188493221768177, "loss": 0.0084, "step": 109840 }, { "epoch": 1.19, "learning_rate": 0.00012186871635207887, "loss": 0.0102, "step": 109850 }, { "epoch": 1.19, "learning_rate": 0.00012185250048647595, "loss": 0.012, "step": 109860 }, { "epoch": 1.19, "learning_rate": 0.00012183628462087306, "loss": 0.0129, "step": 109870 }, { "epoch": 1.19, "learning_rate": 0.00012182006875527014, "loss": 0.0091, "step": 109880 }, { "epoch": 1.19, "learning_rate": 0.00012180385288966724, "loss": 0.0122, "step": 109890 }, { "epoch": 1.19, "learning_rate": 0.00012178763702406432, "loss": 0.0071, "step": 109900 }, { "epoch": 1.19, "learning_rate": 0.00012177142115846143, "loss": 0.0104, "step": 109910 }, { "epoch": 1.19, "learning_rate": 0.00012175520529285852, "loss": 0.0102, "step": 109920 }, { "epoch": 1.19, "learning_rate": 0.00012173898942725561, "loss": 0.0079, "step": 109930 }, { "epoch": 1.19, "learning_rate": 0.0001217227735616527, "loss": 0.0085, "step": 109940 }, { "epoch": 1.19, "learning_rate": 0.0001217065576960498, "loss": 0.0087, "step": 109950 }, { "epoch": 1.19, "learning_rate": 0.00012169034183044689, "loss": 0.0084, "step": 109960 }, { "epoch": 1.19, "learning_rate": 0.000121674125964844, "loss": 0.0124, "step": 109970 }, { "epoch": 1.19, "learning_rate": 0.00012165791009924108, "loss": 0.0087, "step": 109980 }, { "epoch": 1.19, "learning_rate": 0.00012164169423363818, "loss": 0.0103, "step": 109990 }, { "epoch": 1.19, "learning_rate": 0.00012162547836803526, "loss": 0.0112, "step": 110000 }, { "epoch": 1.19, "eval_cer": 0.9215582042155038, "eval_loss": 0.007691715378314257, "eval_runtime": 121.2349, "eval_samples_per_second": 16.497, "eval_steps_per_second": 4.124, "step": 110000 }, { "epoch": 1.19, "learning_rate": 0.00012160926250243237, "loss": 0.0104, "step": 110010 }, { "epoch": 1.19, "learning_rate": 0.00012159304663682946, "loss": 0.0125, "step": 110020 }, { "epoch": 1.19, "learning_rate": 0.00012157683077122655, "loss": 0.0101, "step": 110030 }, { "epoch": 1.19, "learning_rate": 0.00012156061490562365, "loss": 0.0124, "step": 110040 }, { "epoch": 1.19, "learning_rate": 0.00012154439904002074, "loss": 0.0086, "step": 110050 }, { "epoch": 1.19, "learning_rate": 0.00012152818317441785, "loss": 0.0079, "step": 110060 }, { "epoch": 1.19, "learning_rate": 0.00012151196730881494, "loss": 0.0072, "step": 110070 }, { "epoch": 1.19, "learning_rate": 0.00012149575144321203, "loss": 0.0113, "step": 110080 }, { "epoch": 1.19, "learning_rate": 0.00012147953557760912, "loss": 0.0108, "step": 110090 }, { "epoch": 1.19, "learning_rate": 0.00012146331971200622, "loss": 0.0124, "step": 110100 }, { "epoch": 1.19, "learning_rate": 0.00012144710384640331, "loss": 0.0135, "step": 110110 }, { "epoch": 1.19, "learning_rate": 0.00012143088798080042, "loss": 0.0127, "step": 110120 }, { "epoch": 1.19, "learning_rate": 0.0001214146721151975, "loss": 0.0101, "step": 110130 }, { "epoch": 1.19, "learning_rate": 0.0001213984562495946, "loss": 0.01, "step": 110140 }, { "epoch": 1.19, "learning_rate": 0.00012138224038399168, "loss": 0.0099, "step": 110150 }, { "epoch": 1.19, "learning_rate": 0.00012136602451838879, "loss": 0.0107, "step": 110160 }, { "epoch": 1.19, "learning_rate": 0.00012134980865278588, "loss": 0.0091, "step": 110170 }, { "epoch": 1.19, "learning_rate": 0.00012133359278718297, "loss": 0.0096, "step": 110180 }, { "epoch": 1.19, "learning_rate": 0.00012131737692158007, "loss": 0.0086, "step": 110190 }, { "epoch": 1.19, "learning_rate": 0.00012130116105597716, "loss": 0.0115, "step": 110200 }, { "epoch": 1.19, "learning_rate": 0.00012128494519037425, "loss": 0.0098, "step": 110210 }, { "epoch": 1.19, "learning_rate": 0.00012126872932477136, "loss": 0.0098, "step": 110220 }, { "epoch": 1.19, "learning_rate": 0.00012125251345916844, "loss": 0.0116, "step": 110230 }, { "epoch": 1.19, "learning_rate": 0.00012123629759356554, "loss": 0.011, "step": 110240 }, { "epoch": 1.19, "learning_rate": 0.00012122008172796262, "loss": 0.0112, "step": 110250 }, { "epoch": 1.19, "learning_rate": 0.00012120386586235973, "loss": 0.0098, "step": 110260 }, { "epoch": 1.19, "learning_rate": 0.00012118764999675681, "loss": 0.0093, "step": 110270 }, { "epoch": 1.19, "learning_rate": 0.00012117143413115391, "loss": 0.0088, "step": 110280 }, { "epoch": 1.19, "learning_rate": 0.000121155218265551, "loss": 0.0089, "step": 110290 }, { "epoch": 1.19, "learning_rate": 0.0001211390023999481, "loss": 0.008, "step": 110300 }, { "epoch": 1.19, "learning_rate": 0.00012112278653434519, "loss": 0.0086, "step": 110310 }, { "epoch": 1.19, "learning_rate": 0.0001211065706687423, "loss": 0.0103, "step": 110320 }, { "epoch": 1.19, "learning_rate": 0.00012109035480313938, "loss": 0.0091, "step": 110330 }, { "epoch": 1.19, "learning_rate": 0.00012107413893753648, "loss": 0.0137, "step": 110340 }, { "epoch": 1.19, "learning_rate": 0.00012105792307193356, "loss": 0.0095, "step": 110350 }, { "epoch": 1.19, "learning_rate": 0.00012104170720633067, "loss": 0.0081, "step": 110360 }, { "epoch": 1.19, "learning_rate": 0.00012102549134072775, "loss": 0.0106, "step": 110370 }, { "epoch": 1.19, "learning_rate": 0.00012100927547512485, "loss": 0.0072, "step": 110380 }, { "epoch": 1.19, "learning_rate": 0.00012099305960952195, "loss": 0.01, "step": 110390 }, { "epoch": 1.19, "learning_rate": 0.00012097684374391904, "loss": 0.01, "step": 110400 }, { "epoch": 1.19, "learning_rate": 0.00012096062787831613, "loss": 0.0064, "step": 110410 }, { "epoch": 1.19, "learning_rate": 0.00012094441201271323, "loss": 0.0088, "step": 110420 }, { "epoch": 1.19, "learning_rate": 0.00012092819614711032, "loss": 0.0084, "step": 110430 }, { "epoch": 1.19, "learning_rate": 0.00012091198028150742, "loss": 0.0069, "step": 110440 }, { "epoch": 1.19, "learning_rate": 0.0001208957644159045, "loss": 0.0092, "step": 110450 }, { "epoch": 1.19, "learning_rate": 0.00012087954855030161, "loss": 0.0087, "step": 110460 }, { "epoch": 1.19, "learning_rate": 0.00012086333268469869, "loss": 0.0082, "step": 110470 }, { "epoch": 1.19, "learning_rate": 0.0001208471168190958, "loss": 0.0087, "step": 110480 }, { "epoch": 1.19, "learning_rate": 0.00012083090095349289, "loss": 0.0101, "step": 110490 }, { "epoch": 1.19, "learning_rate": 0.00012081468508788998, "loss": 0.017, "step": 110500 }, { "epoch": 1.19, "learning_rate": 0.00012079846922228707, "loss": 0.0102, "step": 110510 }, { "epoch": 1.19, "learning_rate": 0.00012078225335668417, "loss": 0.0066, "step": 110520 }, { "epoch": 1.19, "learning_rate": 0.00012076603749108126, "loss": 0.0093, "step": 110530 }, { "epoch": 1.19, "learning_rate": 0.00012074982162547837, "loss": 0.009, "step": 110540 }, { "epoch": 1.2, "learning_rate": 0.00012073360575987544, "loss": 0.0079, "step": 110550 }, { "epoch": 1.2, "learning_rate": 0.00012071738989427255, "loss": 0.0084, "step": 110560 }, { "epoch": 1.2, "learning_rate": 0.00012070117402866963, "loss": 0.0082, "step": 110570 }, { "epoch": 1.2, "learning_rate": 0.00012068495816306674, "loss": 0.0092, "step": 110580 }, { "epoch": 1.2, "learning_rate": 0.00012066874229746382, "loss": 0.0126, "step": 110590 }, { "epoch": 1.2, "learning_rate": 0.00012065252643186092, "loss": 0.0112, "step": 110600 }, { "epoch": 1.2, "learning_rate": 0.00012063631056625801, "loss": 0.0095, "step": 110610 }, { "epoch": 1.2, "learning_rate": 0.00012062009470065511, "loss": 0.011, "step": 110620 }, { "epoch": 1.2, "learning_rate": 0.0001206038788350522, "loss": 0.0089, "step": 110630 }, { "epoch": 1.2, "learning_rate": 0.0001205876629694493, "loss": 0.0093, "step": 110640 }, { "epoch": 1.2, "learning_rate": 0.00012057144710384639, "loss": 0.0094, "step": 110650 }, { "epoch": 1.2, "learning_rate": 0.00012055523123824349, "loss": 0.0081, "step": 110660 }, { "epoch": 1.2, "learning_rate": 0.00012053901537264057, "loss": 0.0088, "step": 110670 }, { "epoch": 1.2, "learning_rate": 0.00012052279950703768, "loss": 0.009, "step": 110680 }, { "epoch": 1.2, "learning_rate": 0.00012050658364143476, "loss": 0.0071, "step": 110690 }, { "epoch": 1.2, "learning_rate": 0.00012049036777583186, "loss": 0.0091, "step": 110700 }, { "epoch": 1.2, "learning_rate": 0.00012047415191022896, "loss": 0.0099, "step": 110710 }, { "epoch": 1.2, "learning_rate": 0.00012045793604462605, "loss": 0.0085, "step": 110720 }, { "epoch": 1.2, "learning_rate": 0.00012044172017902314, "loss": 0.0094, "step": 110730 }, { "epoch": 1.2, "learning_rate": 0.00012042550431342023, "loss": 0.0123, "step": 110740 }, { "epoch": 1.2, "learning_rate": 0.00012040928844781733, "loss": 0.0103, "step": 110750 }, { "epoch": 1.2, "learning_rate": 0.00012039307258221443, "loss": 0.0096, "step": 110760 }, { "epoch": 1.2, "learning_rate": 0.00012037685671661151, "loss": 0.0097, "step": 110770 }, { "epoch": 1.2, "learning_rate": 0.00012036064085100862, "loss": 0.0095, "step": 110780 }, { "epoch": 1.2, "learning_rate": 0.00012034442498540572, "loss": 0.0103, "step": 110790 }, { "epoch": 1.2, "learning_rate": 0.0001203282091198028, "loss": 0.0112, "step": 110800 }, { "epoch": 1.2, "learning_rate": 0.00012031199325419991, "loss": 0.0081, "step": 110810 }, { "epoch": 1.2, "learning_rate": 0.00012029577738859699, "loss": 0.0091, "step": 110820 }, { "epoch": 1.2, "learning_rate": 0.0001202795615229941, "loss": 0.0086, "step": 110830 }, { "epoch": 1.2, "learning_rate": 0.00012026334565739118, "loss": 0.0109, "step": 110840 }, { "epoch": 1.2, "learning_rate": 0.00012024712979178828, "loss": 0.0108, "step": 110850 }, { "epoch": 1.2, "learning_rate": 0.00012023091392618537, "loss": 0.0099, "step": 110860 }, { "epoch": 1.2, "learning_rate": 0.00012021469806058247, "loss": 0.0089, "step": 110870 }, { "epoch": 1.2, "learning_rate": 0.00012019848219497956, "loss": 0.0102, "step": 110880 }, { "epoch": 1.2, "learning_rate": 0.00012018226632937665, "loss": 0.0102, "step": 110890 }, { "epoch": 1.2, "learning_rate": 0.00012016605046377375, "loss": 0.0105, "step": 110900 }, { "epoch": 1.2, "learning_rate": 0.00012014983459817085, "loss": 0.0118, "step": 110910 }, { "epoch": 1.2, "learning_rate": 0.00012013361873256793, "loss": 0.0089, "step": 110920 }, { "epoch": 1.2, "learning_rate": 0.00012011740286696504, "loss": 0.0098, "step": 110930 }, { "epoch": 1.2, "learning_rate": 0.00012010118700136212, "loss": 0.0092, "step": 110940 }, { "epoch": 1.2, "learning_rate": 0.00012008497113575922, "loss": 0.0098, "step": 110950 }, { "epoch": 1.2, "learning_rate": 0.0001200687552701563, "loss": 0.0069, "step": 110960 }, { "epoch": 1.2, "learning_rate": 0.00012005253940455341, "loss": 0.0113, "step": 110970 }, { "epoch": 1.2, "learning_rate": 0.0001200363235389505, "loss": 0.0122, "step": 110980 }, { "epoch": 1.2, "learning_rate": 0.0001200201076733476, "loss": 0.0119, "step": 110990 }, { "epoch": 1.2, "learning_rate": 0.00012000389180774469, "loss": 0.0092, "step": 111000 }, { "epoch": 1.2, "eval_cer": 0.9215321461268126, "eval_loss": 0.0076298159547150135, "eval_runtime": 121.3154, "eval_samples_per_second": 16.486, "eval_steps_per_second": 4.121, "step": 111000 }, { "epoch": 1.2, "learning_rate": 0.00011998767594214179, "loss": 0.0091, "step": 111010 }, { "epoch": 1.2, "learning_rate": 0.00011997146007653887, "loss": 0.0093, "step": 111020 }, { "epoch": 1.2, "learning_rate": 0.00011995524421093598, "loss": 0.0133, "step": 111030 }, { "epoch": 1.2, "learning_rate": 0.00011993902834533306, "loss": 0.0082, "step": 111040 }, { "epoch": 1.2, "learning_rate": 0.00011992281247973016, "loss": 0.0125, "step": 111050 }, { "epoch": 1.2, "learning_rate": 0.00011990659661412724, "loss": 0.0111, "step": 111060 }, { "epoch": 1.2, "learning_rate": 0.00011989038074852435, "loss": 0.0124, "step": 111070 }, { "epoch": 1.2, "learning_rate": 0.00011987416488292144, "loss": 0.0097, "step": 111080 }, { "epoch": 1.2, "learning_rate": 0.00011985794901731853, "loss": 0.0086, "step": 111090 }, { "epoch": 1.2, "learning_rate": 0.00011984173315171563, "loss": 0.0114, "step": 111100 }, { "epoch": 1.2, "learning_rate": 0.00011982551728611272, "loss": 0.0121, "step": 111110 }, { "epoch": 1.2, "learning_rate": 0.00011980930142050981, "loss": 0.0088, "step": 111120 }, { "epoch": 1.2, "learning_rate": 0.00011979308555490692, "loss": 0.0119, "step": 111130 }, { "epoch": 1.2, "learning_rate": 0.000119776869689304, "loss": 0.0099, "step": 111140 }, { "epoch": 1.2, "learning_rate": 0.0001197606538237011, "loss": 0.01, "step": 111150 }, { "epoch": 1.2, "learning_rate": 0.00011974443795809818, "loss": 0.0086, "step": 111160 }, { "epoch": 1.2, "learning_rate": 0.00011972822209249529, "loss": 0.0089, "step": 111170 }, { "epoch": 1.2, "learning_rate": 0.00011971200622689238, "loss": 0.0103, "step": 111180 }, { "epoch": 1.2, "learning_rate": 0.00011969579036128948, "loss": 0.0117, "step": 111190 }, { "epoch": 1.2, "learning_rate": 0.00011967957449568657, "loss": 0.0096, "step": 111200 }, { "epoch": 1.2, "learning_rate": 0.00011966335863008366, "loss": 0.0114, "step": 111210 }, { "epoch": 1.2, "learning_rate": 0.00011964714276448075, "loss": 0.0113, "step": 111220 }, { "epoch": 1.2, "learning_rate": 0.00011963092689887786, "loss": 0.0094, "step": 111230 }, { "epoch": 1.2, "learning_rate": 0.00011961471103327494, "loss": 0.0073, "step": 111240 }, { "epoch": 1.2, "learning_rate": 0.00011959849516767205, "loss": 0.0096, "step": 111250 }, { "epoch": 1.2, "learning_rate": 0.00011958227930206912, "loss": 0.0094, "step": 111260 }, { "epoch": 1.2, "learning_rate": 0.00011956606343646623, "loss": 0.0098, "step": 111270 }, { "epoch": 1.2, "learning_rate": 0.00011954984757086331, "loss": 0.013, "step": 111280 }, { "epoch": 1.2, "learning_rate": 0.00011953363170526042, "loss": 0.0117, "step": 111290 }, { "epoch": 1.2, "learning_rate": 0.00011951741583965751, "loss": 0.0116, "step": 111300 }, { "epoch": 1.2, "learning_rate": 0.0001195011999740546, "loss": 0.0085, "step": 111310 }, { "epoch": 1.2, "learning_rate": 0.0001194849841084517, "loss": 0.0122, "step": 111320 }, { "epoch": 1.2, "learning_rate": 0.0001194687682428488, "loss": 0.0132, "step": 111330 }, { "epoch": 1.2, "learning_rate": 0.00011945255237724588, "loss": 0.0133, "step": 111340 }, { "epoch": 1.2, "learning_rate": 0.00011943633651164299, "loss": 0.0101, "step": 111350 }, { "epoch": 1.2, "learning_rate": 0.00011942012064604007, "loss": 0.0097, "step": 111360 }, { "epoch": 1.2, "learning_rate": 0.00011940390478043717, "loss": 0.0147, "step": 111370 }, { "epoch": 1.2, "learning_rate": 0.00011938768891483425, "loss": 0.0106, "step": 111380 }, { "epoch": 1.2, "learning_rate": 0.00011937147304923136, "loss": 0.0124, "step": 111390 }, { "epoch": 1.2, "learning_rate": 0.00011935525718362845, "loss": 0.0102, "step": 111400 }, { "epoch": 1.2, "learning_rate": 0.00011933904131802554, "loss": 0.0115, "step": 111410 }, { "epoch": 1.2, "learning_rate": 0.00011932282545242264, "loss": 0.0121, "step": 111420 }, { "epoch": 1.2, "learning_rate": 0.00011930660958681973, "loss": 0.0081, "step": 111430 }, { "epoch": 1.2, "learning_rate": 0.00011929039372121682, "loss": 0.0085, "step": 111440 }, { "epoch": 1.2, "learning_rate": 0.00011927417785561393, "loss": 0.0135, "step": 111450 }, { "epoch": 1.2, "learning_rate": 0.000119257961990011, "loss": 0.0108, "step": 111460 }, { "epoch": 1.21, "learning_rate": 0.00011924174612440811, "loss": 0.0081, "step": 111470 }, { "epoch": 1.21, "learning_rate": 0.00011922553025880519, "loss": 0.0115, "step": 111480 }, { "epoch": 1.21, "learning_rate": 0.0001192093143932023, "loss": 0.0089, "step": 111490 }, { "epoch": 1.21, "learning_rate": 0.0001191930985275994, "loss": 0.0095, "step": 111500 }, { "epoch": 1.21, "learning_rate": 0.00011917688266199648, "loss": 0.0075, "step": 111510 }, { "epoch": 1.21, "learning_rate": 0.00011916066679639359, "loss": 0.0128, "step": 111520 }, { "epoch": 1.21, "learning_rate": 0.00011914445093079067, "loss": 0.0094, "step": 111530 }, { "epoch": 1.21, "learning_rate": 0.00011912823506518778, "loss": 0.0095, "step": 111540 }, { "epoch": 1.21, "learning_rate": 0.00011911201919958487, "loss": 0.0093, "step": 111550 }, { "epoch": 1.21, "learning_rate": 0.00011909580333398196, "loss": 0.0095, "step": 111560 }, { "epoch": 1.21, "learning_rate": 0.00011907958746837905, "loss": 0.0083, "step": 111570 }, { "epoch": 1.21, "learning_rate": 0.00011906337160277615, "loss": 0.0092, "step": 111580 }, { "epoch": 1.21, "learning_rate": 0.00011904715573717324, "loss": 0.0116, "step": 111590 }, { "epoch": 1.21, "learning_rate": 0.00011903093987157035, "loss": 0.0092, "step": 111600 }, { "epoch": 1.21, "learning_rate": 0.00011901472400596742, "loss": 0.0097, "step": 111610 }, { "epoch": 1.21, "learning_rate": 0.00011899850814036453, "loss": 0.009, "step": 111620 }, { "epoch": 1.21, "learning_rate": 0.00011898229227476161, "loss": 0.0096, "step": 111630 }, { "epoch": 1.21, "learning_rate": 0.00011896607640915872, "loss": 0.0092, "step": 111640 }, { "epoch": 1.21, "learning_rate": 0.00011894986054355581, "loss": 0.0098, "step": 111650 }, { "epoch": 1.21, "learning_rate": 0.0001189336446779529, "loss": 0.0109, "step": 111660 }, { "epoch": 1.21, "learning_rate": 0.00011891742881235, "loss": 0.0108, "step": 111670 }, { "epoch": 1.21, "learning_rate": 0.00011890121294674709, "loss": 0.0097, "step": 111680 }, { "epoch": 1.21, "learning_rate": 0.00011888499708114418, "loss": 0.0082, "step": 111690 }, { "epoch": 1.21, "learning_rate": 0.00011886878121554129, "loss": 0.0112, "step": 111700 }, { "epoch": 1.21, "learning_rate": 0.00011885256534993837, "loss": 0.0093, "step": 111710 }, { "epoch": 1.21, "learning_rate": 0.00011883634948433547, "loss": 0.0089, "step": 111720 }, { "epoch": 1.21, "learning_rate": 0.00011882013361873255, "loss": 0.0095, "step": 111730 }, { "epoch": 1.21, "learning_rate": 0.00011880391775312966, "loss": 0.0095, "step": 111740 }, { "epoch": 1.21, "learning_rate": 0.00011878770188752674, "loss": 0.0121, "step": 111750 }, { "epoch": 1.21, "learning_rate": 0.00011877148602192384, "loss": 0.0089, "step": 111760 }, { "epoch": 1.21, "learning_rate": 0.00011875527015632094, "loss": 0.0111, "step": 111770 }, { "epoch": 1.21, "learning_rate": 0.00011873905429071803, "loss": 0.0106, "step": 111780 }, { "epoch": 1.21, "learning_rate": 0.00011872283842511512, "loss": 0.0095, "step": 111790 }, { "epoch": 1.21, "learning_rate": 0.00011870662255951223, "loss": 0.0116, "step": 111800 }, { "epoch": 1.21, "learning_rate": 0.00011869040669390931, "loss": 0.0108, "step": 111810 }, { "epoch": 1.21, "learning_rate": 0.00011867419082830641, "loss": 0.0133, "step": 111820 }, { "epoch": 1.21, "learning_rate": 0.00011865797496270349, "loss": 0.0094, "step": 111830 }, { "epoch": 1.21, "learning_rate": 0.0001186417590971006, "loss": 0.009, "step": 111840 }, { "epoch": 1.21, "learning_rate": 0.00011862554323149768, "loss": 0.0109, "step": 111850 }, { "epoch": 1.21, "learning_rate": 0.00011860932736589478, "loss": 0.009, "step": 111860 }, { "epoch": 1.21, "learning_rate": 0.00011859311150029188, "loss": 0.0104, "step": 111870 }, { "epoch": 1.21, "learning_rate": 0.00011857689563468897, "loss": 0.0084, "step": 111880 }, { "epoch": 1.21, "learning_rate": 0.00011856067976908606, "loss": 0.0082, "step": 111890 }, { "epoch": 1.21, "learning_rate": 0.00011854446390348316, "loss": 0.009, "step": 111900 }, { "epoch": 1.21, "learning_rate": 0.00011852824803788025, "loss": 0.0088, "step": 111910 }, { "epoch": 1.21, "learning_rate": 0.00011851203217227735, "loss": 0.0114, "step": 111920 }, { "epoch": 1.21, "learning_rate": 0.00011849581630667443, "loss": 0.0121, "step": 111930 }, { "epoch": 1.21, "learning_rate": 0.00011847960044107154, "loss": 0.0109, "step": 111940 }, { "epoch": 1.21, "learning_rate": 0.00011846338457546862, "loss": 0.0084, "step": 111950 }, { "epoch": 1.21, "learning_rate": 0.00011844716870986573, "loss": 0.0101, "step": 111960 }, { "epoch": 1.21, "learning_rate": 0.0001184309528442628, "loss": 0.0111, "step": 111970 }, { "epoch": 1.21, "learning_rate": 0.00011841473697865991, "loss": 0.0101, "step": 111980 }, { "epoch": 1.21, "learning_rate": 0.000118398521113057, "loss": 0.0117, "step": 111990 }, { "epoch": 1.21, "learning_rate": 0.0001183823052474541, "loss": 0.0097, "step": 112000 }, { "epoch": 1.21, "eval_cer": 0.9215408321563763, "eval_loss": 0.007726356852799654, "eval_runtime": 121.0775, "eval_samples_per_second": 16.518, "eval_steps_per_second": 4.13, "step": 112000 }, { "epoch": 1.21, "learning_rate": 0.00011836608938185119, "loss": 0.011, "step": 112010 }, { "epoch": 1.21, "learning_rate": 0.0001183498735162483, "loss": 0.0099, "step": 112020 }, { "epoch": 1.21, "learning_rate": 0.00011833365765064537, "loss": 0.0086, "step": 112030 }, { "epoch": 1.21, "learning_rate": 0.00011831744178504248, "loss": 0.0088, "step": 112040 }, { "epoch": 1.21, "learning_rate": 0.00011830122591943956, "loss": 0.0082, "step": 112050 }, { "epoch": 1.21, "learning_rate": 0.00011828501005383667, "loss": 0.0118, "step": 112060 }, { "epoch": 1.21, "learning_rate": 0.00011826879418823375, "loss": 0.0086, "step": 112070 }, { "epoch": 1.21, "learning_rate": 0.00011825257832263085, "loss": 0.0103, "step": 112080 }, { "epoch": 1.21, "learning_rate": 0.00011823636245702794, "loss": 0.0096, "step": 112090 }, { "epoch": 1.21, "learning_rate": 0.00011822014659142504, "loss": 0.0102, "step": 112100 }, { "epoch": 1.21, "learning_rate": 0.00011820393072582213, "loss": 0.0105, "step": 112110 }, { "epoch": 1.21, "learning_rate": 0.00011818771486021922, "loss": 0.0085, "step": 112120 }, { "epoch": 1.21, "learning_rate": 0.00011817149899461632, "loss": 0.0083, "step": 112130 }, { "epoch": 1.21, "learning_rate": 0.00011815528312901342, "loss": 0.0117, "step": 112140 }, { "epoch": 1.21, "learning_rate": 0.0001181390672634105, "loss": 0.0107, "step": 112150 }, { "epoch": 1.21, "learning_rate": 0.00011812285139780761, "loss": 0.0076, "step": 112160 }, { "epoch": 1.21, "learning_rate": 0.00011810663553220469, "loss": 0.0096, "step": 112170 }, { "epoch": 1.21, "learning_rate": 0.00011809041966660179, "loss": 0.0099, "step": 112180 }, { "epoch": 1.21, "learning_rate": 0.00011807420380099889, "loss": 0.0083, "step": 112190 }, { "epoch": 1.21, "learning_rate": 0.00011805798793539598, "loss": 0.01, "step": 112200 }, { "epoch": 1.21, "learning_rate": 0.00011804177206979307, "loss": 0.0104, "step": 112210 }, { "epoch": 1.21, "learning_rate": 0.00011802555620419016, "loss": 0.0093, "step": 112220 }, { "epoch": 1.21, "learning_rate": 0.00011800934033858727, "loss": 0.0109, "step": 112230 }, { "epoch": 1.21, "learning_rate": 0.00011799312447298436, "loss": 0.0091, "step": 112240 }, { "epoch": 1.21, "learning_rate": 0.00011797690860738146, "loss": 0.0088, "step": 112250 }, { "epoch": 1.21, "learning_rate": 0.00011796069274177855, "loss": 0.0093, "step": 112260 }, { "epoch": 1.21, "learning_rate": 0.00011794447687617565, "loss": 0.0103, "step": 112270 }, { "epoch": 1.21, "learning_rate": 0.00011792826101057273, "loss": 0.0097, "step": 112280 }, { "epoch": 1.21, "learning_rate": 0.00011791204514496984, "loss": 0.0096, "step": 112290 }, { "epoch": 1.21, "learning_rate": 0.00011789582927936692, "loss": 0.0114, "step": 112300 }, { "epoch": 1.21, "learning_rate": 0.00011787961341376403, "loss": 0.0101, "step": 112310 }, { "epoch": 1.21, "learning_rate": 0.0001178633975481611, "loss": 0.0119, "step": 112320 }, { "epoch": 1.21, "learning_rate": 0.00011784718168255821, "loss": 0.0079, "step": 112330 }, { "epoch": 1.21, "learning_rate": 0.0001178309658169553, "loss": 0.0085, "step": 112340 }, { "epoch": 1.21, "learning_rate": 0.0001178147499513524, "loss": 0.0101, "step": 112350 }, { "epoch": 1.21, "learning_rate": 0.00011779853408574949, "loss": 0.0131, "step": 112360 }, { "epoch": 1.21, "learning_rate": 0.00011778231822014658, "loss": 0.0078, "step": 112370 }, { "epoch": 1.21, "learning_rate": 0.00011776610235454367, "loss": 0.01, "step": 112380 }, { "epoch": 1.21, "learning_rate": 0.00011774988648894078, "loss": 0.0092, "step": 112390 }, { "epoch": 1.22, "learning_rate": 0.00011773367062333786, "loss": 0.0081, "step": 112400 }, { "epoch": 1.22, "learning_rate": 0.00011771745475773497, "loss": 0.0091, "step": 112410 }, { "epoch": 1.22, "learning_rate": 0.00011770123889213205, "loss": 0.0086, "step": 112420 }, { "epoch": 1.22, "learning_rate": 0.00011768502302652915, "loss": 0.0109, "step": 112430 }, { "epoch": 1.22, "learning_rate": 0.00011766880716092623, "loss": 0.0084, "step": 112440 }, { "epoch": 1.22, "learning_rate": 0.00011765259129532334, "loss": 0.01, "step": 112450 }, { "epoch": 1.22, "learning_rate": 0.00011763637542972043, "loss": 0.0088, "step": 112460 }, { "epoch": 1.22, "learning_rate": 0.00011762015956411752, "loss": 0.0073, "step": 112470 }, { "epoch": 1.22, "learning_rate": 0.00011760394369851462, "loss": 0.0092, "step": 112480 }, { "epoch": 1.22, "learning_rate": 0.00011758772783291172, "loss": 0.0079, "step": 112490 }, { "epoch": 1.22, "learning_rate": 0.0001175715119673088, "loss": 0.0078, "step": 112500 }, { "epoch": 1.22, "learning_rate": 0.00011755529610170591, "loss": 0.0065, "step": 112510 }, { "epoch": 1.22, "learning_rate": 0.00011753908023610299, "loss": 0.0104, "step": 112520 }, { "epoch": 1.22, "learning_rate": 0.00011752286437050009, "loss": 0.01, "step": 112530 }, { "epoch": 1.22, "learning_rate": 0.00011750664850489717, "loss": 0.0109, "step": 112540 }, { "epoch": 1.22, "learning_rate": 0.00011749043263929428, "loss": 0.0092, "step": 112550 }, { "epoch": 1.22, "learning_rate": 0.00011747421677369137, "loss": 0.0102, "step": 112560 }, { "epoch": 1.22, "learning_rate": 0.00011745800090808846, "loss": 0.0117, "step": 112570 }, { "epoch": 1.22, "learning_rate": 0.00011744178504248556, "loss": 0.0094, "step": 112580 }, { "epoch": 1.22, "learning_rate": 0.00011742556917688265, "loss": 0.009, "step": 112590 }, { "epoch": 1.22, "learning_rate": 0.00011740935331127974, "loss": 0.0077, "step": 112600 }, { "epoch": 1.22, "learning_rate": 0.00011739313744567685, "loss": 0.0097, "step": 112610 }, { "epoch": 1.22, "learning_rate": 0.00011737692158007393, "loss": 0.0075, "step": 112620 }, { "epoch": 1.22, "learning_rate": 0.00011736070571447103, "loss": 0.0106, "step": 112630 }, { "epoch": 1.22, "learning_rate": 0.00011734448984886811, "loss": 0.0078, "step": 112640 }, { "epoch": 1.22, "learning_rate": 0.00011732827398326522, "loss": 0.0108, "step": 112650 }, { "epoch": 1.22, "learning_rate": 0.00011731205811766231, "loss": 0.0115, "step": 112660 }, { "epoch": 1.22, "learning_rate": 0.0001172958422520594, "loss": 0.011, "step": 112670 }, { "epoch": 1.22, "learning_rate": 0.0001172796263864565, "loss": 0.0094, "step": 112680 }, { "epoch": 1.22, "learning_rate": 0.00011726341052085359, "loss": 0.0125, "step": 112690 }, { "epoch": 1.22, "learning_rate": 0.00011724719465525068, "loss": 0.0086, "step": 112700 }, { "epoch": 1.22, "learning_rate": 0.00011723097878964779, "loss": 0.0115, "step": 112710 }, { "epoch": 1.22, "learning_rate": 0.00011721476292404487, "loss": 0.0111, "step": 112720 }, { "epoch": 1.22, "learning_rate": 0.00011719854705844197, "loss": 0.009, "step": 112730 }, { "epoch": 1.22, "learning_rate": 0.00011718233119283905, "loss": 0.0108, "step": 112740 }, { "epoch": 1.22, "learning_rate": 0.00011716611532723616, "loss": 0.0109, "step": 112750 }, { "epoch": 1.22, "learning_rate": 0.00011714989946163324, "loss": 0.0092, "step": 112760 }, { "epoch": 1.22, "learning_rate": 0.00011713368359603035, "loss": 0.0105, "step": 112770 }, { "epoch": 1.22, "learning_rate": 0.00011711746773042744, "loss": 0.0111, "step": 112780 }, { "epoch": 1.22, "learning_rate": 0.00011710125186482453, "loss": 0.0099, "step": 112790 }, { "epoch": 1.22, "learning_rate": 0.00011708503599922162, "loss": 0.0099, "step": 112800 }, { "epoch": 1.22, "learning_rate": 0.00011706882013361873, "loss": 0.0118, "step": 112810 }, { "epoch": 1.22, "learning_rate": 0.00011705260426801581, "loss": 0.0102, "step": 112820 }, { "epoch": 1.22, "learning_rate": 0.00011703638840241292, "loss": 0.0101, "step": 112830 }, { "epoch": 1.22, "learning_rate": 0.00011702017253681, "loss": 0.0118, "step": 112840 }, { "epoch": 1.22, "learning_rate": 0.0001170039566712071, "loss": 0.0082, "step": 112850 }, { "epoch": 1.22, "learning_rate": 0.00011698774080560418, "loss": 0.0077, "step": 112860 }, { "epoch": 1.22, "learning_rate": 0.00011697152494000129, "loss": 0.0082, "step": 112870 }, { "epoch": 1.22, "learning_rate": 0.00011695530907439838, "loss": 0.0101, "step": 112880 }, { "epoch": 1.22, "learning_rate": 0.00011693909320879547, "loss": 0.0096, "step": 112890 }, { "epoch": 1.22, "learning_rate": 0.00011692287734319256, "loss": 0.0084, "step": 112900 }, { "epoch": 1.22, "learning_rate": 0.00011690666147758966, "loss": 0.0091, "step": 112910 }, { "epoch": 1.22, "learning_rate": 0.00011689044561198675, "loss": 0.0084, "step": 112920 }, { "epoch": 1.22, "learning_rate": 0.00011687422974638386, "loss": 0.013, "step": 112930 }, { "epoch": 1.22, "learning_rate": 0.00011685801388078095, "loss": 0.009, "step": 112940 }, { "epoch": 1.22, "learning_rate": 0.00011684179801517804, "loss": 0.0092, "step": 112950 }, { "epoch": 1.22, "learning_rate": 0.00011682558214957515, "loss": 0.0103, "step": 112960 }, { "epoch": 1.22, "learning_rate": 0.00011680936628397223, "loss": 0.0105, "step": 112970 }, { "epoch": 1.22, "learning_rate": 0.00011679315041836933, "loss": 0.0102, "step": 112980 }, { "epoch": 1.22, "learning_rate": 0.00011677693455276641, "loss": 0.009, "step": 112990 }, { "epoch": 1.22, "learning_rate": 0.00011676071868716352, "loss": 0.0093, "step": 113000 }, { "epoch": 1.22, "eval_cer": 0.9215060880381213, "eval_loss": 0.00777030223980546, "eval_runtime": 121.2227, "eval_samples_per_second": 16.499, "eval_steps_per_second": 4.125, "step": 113000 }, { "epoch": 1.22, "learning_rate": 0.0001167445028215606, "loss": 0.0089, "step": 113010 }, { "epoch": 1.22, "learning_rate": 0.0001167282869559577, "loss": 0.0096, "step": 113020 }, { "epoch": 1.22, "learning_rate": 0.0001167120710903548, "loss": 0.009, "step": 113030 }, { "epoch": 1.22, "learning_rate": 0.00011669585522475189, "loss": 0.0093, "step": 113040 }, { "epoch": 1.22, "learning_rate": 0.00011667963935914898, "loss": 0.0094, "step": 113050 }, { "epoch": 1.22, "learning_rate": 0.00011666342349354608, "loss": 0.0091, "step": 113060 }, { "epoch": 1.22, "learning_rate": 0.00011664720762794317, "loss": 0.008, "step": 113070 }, { "epoch": 1.22, "learning_rate": 0.00011663099176234027, "loss": 0.0107, "step": 113080 }, { "epoch": 1.22, "learning_rate": 0.00011661477589673735, "loss": 0.0096, "step": 113090 }, { "epoch": 1.22, "learning_rate": 0.00011659856003113446, "loss": 0.0087, "step": 113100 }, { "epoch": 1.22, "learning_rate": 0.00011658234416553154, "loss": 0.0101, "step": 113110 }, { "epoch": 1.22, "learning_rate": 0.00011656612829992865, "loss": 0.0118, "step": 113120 }, { "epoch": 1.22, "learning_rate": 0.00011654991243432573, "loss": 0.0107, "step": 113130 }, { "epoch": 1.22, "learning_rate": 0.00011653369656872283, "loss": 0.0087, "step": 113140 }, { "epoch": 1.22, "learning_rate": 0.00011651748070311992, "loss": 0.0101, "step": 113150 }, { "epoch": 1.22, "learning_rate": 0.00011650126483751702, "loss": 0.0109, "step": 113160 }, { "epoch": 1.22, "learning_rate": 0.00011648504897191411, "loss": 0.0076, "step": 113170 }, { "epoch": 1.22, "learning_rate": 0.00011646883310631122, "loss": 0.0117, "step": 113180 }, { "epoch": 1.22, "learning_rate": 0.0001164526172407083, "loss": 0.0085, "step": 113190 }, { "epoch": 1.22, "learning_rate": 0.0001164364013751054, "loss": 0.0085, "step": 113200 }, { "epoch": 1.22, "learning_rate": 0.00011642018550950248, "loss": 0.0091, "step": 113210 }, { "epoch": 1.22, "learning_rate": 0.00011640396964389959, "loss": 0.0099, "step": 113220 }, { "epoch": 1.22, "learning_rate": 0.00011638775377829667, "loss": 0.0095, "step": 113230 }, { "epoch": 1.22, "learning_rate": 0.00011637153791269377, "loss": 0.0102, "step": 113240 }, { "epoch": 1.22, "learning_rate": 0.00011635532204709087, "loss": 0.0125, "step": 113250 }, { "epoch": 1.22, "learning_rate": 0.00011633910618148796, "loss": 0.0106, "step": 113260 }, { "epoch": 1.22, "learning_rate": 0.00011632289031588505, "loss": 0.0115, "step": 113270 }, { "epoch": 1.22, "learning_rate": 0.00011630667445028216, "loss": 0.0111, "step": 113280 }, { "epoch": 1.22, "learning_rate": 0.00011629045858467924, "loss": 0.0098, "step": 113290 }, { "epoch": 1.22, "learning_rate": 0.00011627424271907634, "loss": 0.0106, "step": 113300 }, { "epoch": 1.22, "learning_rate": 0.00011625802685347342, "loss": 0.0097, "step": 113310 }, { "epoch": 1.23, "learning_rate": 0.00011624181098787053, "loss": 0.009, "step": 113320 }, { "epoch": 1.23, "learning_rate": 0.00011622559512226761, "loss": 0.0073, "step": 113330 }, { "epoch": 1.23, "learning_rate": 0.00011620937925666471, "loss": 0.01, "step": 113340 }, { "epoch": 1.23, "learning_rate": 0.0001161931633910618, "loss": 0.0091, "step": 113350 }, { "epoch": 1.23, "learning_rate": 0.0001161769475254589, "loss": 0.0109, "step": 113360 }, { "epoch": 1.23, "learning_rate": 0.00011616073165985599, "loss": 0.0092, "step": 113370 }, { "epoch": 1.23, "learning_rate": 0.00011614451579425308, "loss": 0.0103, "step": 113380 }, { "epoch": 1.23, "learning_rate": 0.00011612829992865018, "loss": 0.0102, "step": 113390 }, { "epoch": 1.23, "learning_rate": 0.00011611208406304728, "loss": 0.0112, "step": 113400 }, { "epoch": 1.23, "learning_rate": 0.00011609586819744436, "loss": 0.0081, "step": 113410 }, { "epoch": 1.23, "learning_rate": 0.00011607965233184147, "loss": 0.0117, "step": 113420 }, { "epoch": 1.23, "learning_rate": 0.00011606343646623855, "loss": 0.0126, "step": 113430 }, { "epoch": 1.23, "learning_rate": 0.00011604722060063565, "loss": 0.0102, "step": 113440 }, { "epoch": 1.23, "learning_rate": 0.00011603100473503273, "loss": 0.0109, "step": 113450 }, { "epoch": 1.23, "learning_rate": 0.00011601478886942984, "loss": 0.0096, "step": 113460 }, { "epoch": 1.23, "learning_rate": 0.00011599857300382693, "loss": 0.0096, "step": 113470 }, { "epoch": 1.23, "learning_rate": 0.00011598235713822403, "loss": 0.0114, "step": 113480 }, { "epoch": 1.23, "learning_rate": 0.00011596614127262112, "loss": 0.0106, "step": 113490 }, { "epoch": 1.23, "learning_rate": 0.00011594992540701822, "loss": 0.0113, "step": 113500 }, { "epoch": 1.23, "learning_rate": 0.0001159337095414153, "loss": 0.0088, "step": 113510 }, { "epoch": 1.23, "learning_rate": 0.00011591749367581241, "loss": 0.0079, "step": 113520 }, { "epoch": 1.23, "learning_rate": 0.00011590127781020949, "loss": 0.0096, "step": 113530 }, { "epoch": 1.23, "learning_rate": 0.0001158850619446066, "loss": 0.0122, "step": 113540 }, { "epoch": 1.23, "learning_rate": 0.00011586884607900367, "loss": 0.0099, "step": 113550 }, { "epoch": 1.23, "learning_rate": 0.00011585263021340078, "loss": 0.0086, "step": 113560 }, { "epoch": 1.23, "learning_rate": 0.00011583641434779787, "loss": 0.0094, "step": 113570 }, { "epoch": 1.23, "learning_rate": 0.00011582019848219497, "loss": 0.0106, "step": 113580 }, { "epoch": 1.23, "learning_rate": 0.00011580398261659206, "loss": 0.0117, "step": 113590 }, { "epoch": 1.23, "learning_rate": 0.00011578776675098915, "loss": 0.009, "step": 113600 }, { "epoch": 1.23, "learning_rate": 0.00011577155088538624, "loss": 0.012, "step": 113610 }, { "epoch": 1.23, "learning_rate": 0.00011575533501978335, "loss": 0.0104, "step": 113620 }, { "epoch": 1.23, "learning_rate": 0.00011573911915418043, "loss": 0.0078, "step": 113630 }, { "epoch": 1.23, "learning_rate": 0.00011572290328857754, "loss": 0.0093, "step": 113640 }, { "epoch": 1.23, "learning_rate": 0.00011570668742297464, "loss": 0.0093, "step": 113650 }, { "epoch": 1.23, "learning_rate": 0.00011569047155737172, "loss": 0.0111, "step": 113660 }, { "epoch": 1.23, "learning_rate": 0.00011567425569176883, "loss": 0.0078, "step": 113670 }, { "epoch": 1.23, "learning_rate": 0.00011565803982616591, "loss": 0.0095, "step": 113680 }, { "epoch": 1.23, "learning_rate": 0.00011564182396056301, "loss": 0.0081, "step": 113690 }, { "epoch": 1.23, "learning_rate": 0.00011562560809496009, "loss": 0.0102, "step": 113700 }, { "epoch": 1.23, "learning_rate": 0.0001156093922293572, "loss": 0.0097, "step": 113710 }, { "epoch": 1.23, "learning_rate": 0.00011559317636375429, "loss": 0.0094, "step": 113720 }, { "epoch": 1.23, "learning_rate": 0.00011557696049815138, "loss": 0.0104, "step": 113730 }, { "epoch": 1.23, "learning_rate": 0.00011556074463254848, "loss": 0.0111, "step": 113740 }, { "epoch": 1.23, "learning_rate": 0.00011554452876694557, "loss": 0.0099, "step": 113750 }, { "epoch": 1.23, "learning_rate": 0.00011552831290134266, "loss": 0.0099, "step": 113760 }, { "epoch": 1.23, "learning_rate": 0.00011551209703573977, "loss": 0.0086, "step": 113770 }, { "epoch": 1.23, "learning_rate": 0.00011549588117013685, "loss": 0.0092, "step": 113780 }, { "epoch": 1.23, "learning_rate": 0.00011547966530453395, "loss": 0.0139, "step": 113790 }, { "epoch": 1.23, "learning_rate": 0.00011546344943893103, "loss": 0.012, "step": 113800 }, { "epoch": 1.23, "learning_rate": 0.00011544723357332814, "loss": 0.0102, "step": 113810 }, { "epoch": 1.23, "learning_rate": 0.00011543101770772523, "loss": 0.014, "step": 113820 }, { "epoch": 1.23, "learning_rate": 0.00011541480184212233, "loss": 0.01, "step": 113830 }, { "epoch": 1.23, "learning_rate": 0.00011539858597651942, "loss": 0.0103, "step": 113840 }, { "epoch": 1.23, "learning_rate": 0.00011538237011091651, "loss": 0.009, "step": 113850 }, { "epoch": 1.23, "learning_rate": 0.0001153661542453136, "loss": 0.0108, "step": 113860 }, { "epoch": 1.23, "learning_rate": 0.00011534993837971071, "loss": 0.0088, "step": 113870 }, { "epoch": 1.23, "learning_rate": 0.00011533372251410779, "loss": 0.0103, "step": 113880 }, { "epoch": 1.23, "learning_rate": 0.0001153175066485049, "loss": 0.0099, "step": 113890 }, { "epoch": 1.23, "learning_rate": 0.00011530129078290197, "loss": 0.0082, "step": 113900 }, { "epoch": 1.23, "learning_rate": 0.00011528507491729908, "loss": 0.0099, "step": 113910 }, { "epoch": 1.23, "learning_rate": 0.00011526885905169616, "loss": 0.0117, "step": 113920 }, { "epoch": 1.23, "learning_rate": 0.00011525264318609327, "loss": 0.0095, "step": 113930 }, { "epoch": 1.23, "learning_rate": 0.00011523642732049036, "loss": 0.0106, "step": 113940 }, { "epoch": 1.23, "learning_rate": 0.00011522021145488745, "loss": 0.01, "step": 113950 }, { "epoch": 1.23, "learning_rate": 0.00011520399558928454, "loss": 0.0125, "step": 113960 }, { "epoch": 1.23, "learning_rate": 0.00011518777972368165, "loss": 0.0096, "step": 113970 }, { "epoch": 1.23, "learning_rate": 0.00011517156385807873, "loss": 0.0075, "step": 113980 }, { "epoch": 1.23, "learning_rate": 0.00011515534799247584, "loss": 0.0098, "step": 113990 }, { "epoch": 1.23, "learning_rate": 0.00011513913212687292, "loss": 0.0106, "step": 114000 }, { "epoch": 1.23, "eval_cer": 0.9215460437741146, "eval_loss": 0.007686339318752289, "eval_runtime": 121.2235, "eval_samples_per_second": 16.498, "eval_steps_per_second": 4.125, "step": 114000 }, { "epoch": 1.23, "learning_rate": 0.00011512291626127002, "loss": 0.0088, "step": 114010 }, { "epoch": 1.23, "learning_rate": 0.0001151067003956671, "loss": 0.0096, "step": 114020 }, { "epoch": 1.23, "learning_rate": 0.00011509048453006421, "loss": 0.0098, "step": 114030 }, { "epoch": 1.23, "learning_rate": 0.0001150742686644613, "loss": 0.0096, "step": 114040 }, { "epoch": 1.23, "learning_rate": 0.00011505805279885839, "loss": 0.01, "step": 114050 }, { "epoch": 1.23, "learning_rate": 0.00011504183693325549, "loss": 0.0097, "step": 114060 }, { "epoch": 1.23, "learning_rate": 0.00011502562106765258, "loss": 0.0134, "step": 114070 }, { "epoch": 1.23, "learning_rate": 0.00011500940520204967, "loss": 0.008, "step": 114080 }, { "epoch": 1.23, "learning_rate": 0.00011499318933644678, "loss": 0.0089, "step": 114090 }, { "epoch": 1.23, "learning_rate": 0.00011497697347084386, "loss": 0.0088, "step": 114100 }, { "epoch": 1.23, "learning_rate": 0.00011496075760524096, "loss": 0.01, "step": 114110 }, { "epoch": 1.23, "learning_rate": 0.00011494454173963804, "loss": 0.0098, "step": 114120 }, { "epoch": 1.23, "learning_rate": 0.00011492832587403515, "loss": 0.0083, "step": 114130 }, { "epoch": 1.23, "learning_rate": 0.00011491211000843223, "loss": 0.0094, "step": 114140 }, { "epoch": 1.23, "learning_rate": 0.00011489589414282933, "loss": 0.0122, "step": 114150 }, { "epoch": 1.23, "learning_rate": 0.00011487967827722643, "loss": 0.0091, "step": 114160 }, { "epoch": 1.23, "learning_rate": 0.00011486346241162352, "loss": 0.01, "step": 114170 }, { "epoch": 1.23, "learning_rate": 0.00011484724654602061, "loss": 0.0107, "step": 114180 }, { "epoch": 1.23, "learning_rate": 0.00011483103068041772, "loss": 0.0113, "step": 114190 }, { "epoch": 1.23, "learning_rate": 0.0001148148148148148, "loss": 0.0063, "step": 114200 }, { "epoch": 1.23, "learning_rate": 0.0001147985989492119, "loss": 0.0105, "step": 114210 }, { "epoch": 1.23, "learning_rate": 0.00011478238308360898, "loss": 0.0101, "step": 114220 }, { "epoch": 1.23, "learning_rate": 0.00011476616721800609, "loss": 0.0092, "step": 114230 }, { "epoch": 1.23, "learning_rate": 0.00011474995135240317, "loss": 0.0105, "step": 114240 }, { "epoch": 1.24, "learning_rate": 0.00011473373548680027, "loss": 0.0076, "step": 114250 }, { "epoch": 1.24, "learning_rate": 0.00011471751962119737, "loss": 0.0078, "step": 114260 }, { "epoch": 1.24, "learning_rate": 0.00011470130375559446, "loss": 0.01, "step": 114270 }, { "epoch": 1.24, "learning_rate": 0.00011468508788999155, "loss": 0.0082, "step": 114280 }, { "epoch": 1.24, "learning_rate": 0.00011466887202438865, "loss": 0.0123, "step": 114290 }, { "epoch": 1.24, "learning_rate": 0.00011465265615878574, "loss": 0.0089, "step": 114300 }, { "epoch": 1.24, "learning_rate": 0.00011463644029318285, "loss": 0.009, "step": 114310 }, { "epoch": 1.24, "learning_rate": 0.00011462022442757992, "loss": 0.0073, "step": 114320 }, { "epoch": 1.24, "learning_rate": 0.00011460400856197703, "loss": 0.0093, "step": 114330 }, { "epoch": 1.24, "learning_rate": 0.00011458779269637411, "loss": 0.0082, "step": 114340 }, { "epoch": 1.24, "learning_rate": 0.00011457157683077122, "loss": 0.0073, "step": 114350 }, { "epoch": 1.24, "learning_rate": 0.00011455536096516831, "loss": 0.008, "step": 114360 }, { "epoch": 1.24, "learning_rate": 0.0001145391450995654, "loss": 0.0074, "step": 114370 }, { "epoch": 1.24, "learning_rate": 0.00011452292923396251, "loss": 0.0086, "step": 114380 }, { "epoch": 1.24, "learning_rate": 0.00011450671336835959, "loss": 0.0088, "step": 114390 }, { "epoch": 1.24, "learning_rate": 0.0001144904975027567, "loss": 0.0071, "step": 114400 }, { "epoch": 1.24, "learning_rate": 0.00011447428163715379, "loss": 0.0126, "step": 114410 }, { "epoch": 1.24, "learning_rate": 0.00011445806577155088, "loss": 0.0089, "step": 114420 }, { "epoch": 1.24, "learning_rate": 0.00011444184990594797, "loss": 0.013, "step": 114430 }, { "epoch": 1.24, "learning_rate": 0.00011442563404034508, "loss": 0.0086, "step": 114440 }, { "epoch": 1.24, "learning_rate": 0.00011440941817474216, "loss": 0.0098, "step": 114450 }, { "epoch": 1.24, "learning_rate": 0.00011439320230913926, "loss": 0.011, "step": 114460 }, { "epoch": 1.24, "learning_rate": 0.00011437698644353634, "loss": 0.01, "step": 114470 }, { "epoch": 1.24, "learning_rate": 0.00011436077057793345, "loss": 0.0101, "step": 114480 }, { "epoch": 1.24, "learning_rate": 0.00011434455471233053, "loss": 0.0097, "step": 114490 }, { "epoch": 1.24, "learning_rate": 0.00011432833884672763, "loss": 0.0104, "step": 114500 }, { "epoch": 1.24, "learning_rate": 0.00011431212298112473, "loss": 0.0109, "step": 114510 }, { "epoch": 1.24, "learning_rate": 0.00011429590711552182, "loss": 0.0136, "step": 114520 }, { "epoch": 1.24, "learning_rate": 0.00011427969124991891, "loss": 0.0072, "step": 114530 }, { "epoch": 1.24, "learning_rate": 0.000114263475384316, "loss": 0.0099, "step": 114540 }, { "epoch": 1.24, "learning_rate": 0.0001142472595187131, "loss": 0.0115, "step": 114550 }, { "epoch": 1.24, "learning_rate": 0.0001142310436531102, "loss": 0.011, "step": 114560 }, { "epoch": 1.24, "learning_rate": 0.00011421482778750728, "loss": 0.0114, "step": 114570 }, { "epoch": 1.24, "learning_rate": 0.00011419861192190439, "loss": 0.0091, "step": 114580 }, { "epoch": 1.24, "learning_rate": 0.00011418239605630147, "loss": 0.0075, "step": 114590 }, { "epoch": 1.24, "learning_rate": 0.00011416618019069858, "loss": 0.0107, "step": 114600 }, { "epoch": 1.24, "learning_rate": 0.00011414996432509565, "loss": 0.009, "step": 114610 }, { "epoch": 1.24, "learning_rate": 0.00011413374845949276, "loss": 0.0107, "step": 114620 }, { "epoch": 1.24, "learning_rate": 0.00011411753259388985, "loss": 0.0091, "step": 114630 }, { "epoch": 1.24, "learning_rate": 0.00011410131672828695, "loss": 0.0108, "step": 114640 }, { "epoch": 1.24, "learning_rate": 0.00011408510086268404, "loss": 0.0112, "step": 114650 }, { "epoch": 1.24, "learning_rate": 0.00011406888499708115, "loss": 0.0096, "step": 114660 }, { "epoch": 1.24, "learning_rate": 0.00011405266913147822, "loss": 0.0082, "step": 114670 }, { "epoch": 1.24, "learning_rate": 0.00011403645326587533, "loss": 0.0123, "step": 114680 }, { "epoch": 1.24, "learning_rate": 0.00011402023740027241, "loss": 0.0101, "step": 114690 }, { "epoch": 1.24, "learning_rate": 0.00011400402153466952, "loss": 0.01, "step": 114700 }, { "epoch": 1.24, "learning_rate": 0.0001139878056690666, "loss": 0.0118, "step": 114710 }, { "epoch": 1.24, "learning_rate": 0.0001139715898034637, "loss": 0.0081, "step": 114720 }, { "epoch": 1.24, "learning_rate": 0.0001139553739378608, "loss": 0.0122, "step": 114730 }, { "epoch": 1.24, "learning_rate": 0.00011393915807225789, "loss": 0.0106, "step": 114740 }, { "epoch": 1.24, "learning_rate": 0.00011392294220665498, "loss": 0.008, "step": 114750 }, { "epoch": 1.24, "learning_rate": 0.00011390672634105207, "loss": 0.0083, "step": 114760 }, { "epoch": 1.24, "learning_rate": 0.00011389051047544917, "loss": 0.0093, "step": 114770 }, { "epoch": 1.24, "learning_rate": 0.00011387429460984627, "loss": 0.0092, "step": 114780 }, { "epoch": 1.24, "learning_rate": 0.00011385807874424335, "loss": 0.0077, "step": 114790 }, { "epoch": 1.24, "learning_rate": 0.00011384186287864046, "loss": 0.0093, "step": 114800 }, { "epoch": 1.24, "learning_rate": 0.00011382564701303754, "loss": 0.0086, "step": 114810 }, { "epoch": 1.24, "learning_rate": 0.00011380943114743464, "loss": 0.0101, "step": 114820 }, { "epoch": 1.24, "learning_rate": 0.00011379321528183174, "loss": 0.0096, "step": 114830 }, { "epoch": 1.24, "learning_rate": 0.00011377699941622883, "loss": 0.0093, "step": 114840 }, { "epoch": 1.24, "learning_rate": 0.00011376078355062592, "loss": 0.0125, "step": 114850 }, { "epoch": 1.24, "learning_rate": 0.00011374456768502301, "loss": 0.0084, "step": 114860 }, { "epoch": 1.24, "learning_rate": 0.0001137283518194201, "loss": 0.0104, "step": 114870 }, { "epoch": 1.24, "learning_rate": 0.00011371213595381721, "loss": 0.0088, "step": 114880 }, { "epoch": 1.24, "learning_rate": 0.00011369592008821429, "loss": 0.0119, "step": 114890 }, { "epoch": 1.24, "learning_rate": 0.0001136797042226114, "loss": 0.0079, "step": 114900 }, { "epoch": 1.24, "learning_rate": 0.00011366348835700848, "loss": 0.0098, "step": 114910 }, { "epoch": 1.24, "learning_rate": 0.00011364727249140558, "loss": 0.0098, "step": 114920 }, { "epoch": 1.24, "learning_rate": 0.00011363105662580266, "loss": 0.009, "step": 114930 }, { "epoch": 1.24, "learning_rate": 0.00011361484076019977, "loss": 0.0091, "step": 114940 }, { "epoch": 1.24, "learning_rate": 0.00011359862489459686, "loss": 0.0114, "step": 114950 }, { "epoch": 1.24, "learning_rate": 0.00011358240902899395, "loss": 0.0096, "step": 114960 }, { "epoch": 1.24, "learning_rate": 0.00011356619316339105, "loss": 0.0107, "step": 114970 }, { "epoch": 1.24, "learning_rate": 0.00011354997729778815, "loss": 0.0098, "step": 114980 }, { "epoch": 1.24, "learning_rate": 0.00011353376143218523, "loss": 0.0083, "step": 114990 }, { "epoch": 1.24, "learning_rate": 0.00011351754556658234, "loss": 0.0107, "step": 115000 }, { "epoch": 1.24, "eval_cer": 0.9215182484795105, "eval_loss": 0.007636575493961573, "eval_runtime": 121.1591, "eval_samples_per_second": 16.507, "eval_steps_per_second": 4.127, "step": 115000 }, { "epoch": 1.24, "learning_rate": 0.00011350132970097942, "loss": 0.0077, "step": 115010 }, { "epoch": 1.24, "learning_rate": 0.00011348511383537652, "loss": 0.0091, "step": 115020 }, { "epoch": 1.24, "learning_rate": 0.0001134688979697736, "loss": 0.011, "step": 115030 }, { "epoch": 1.24, "learning_rate": 0.00011345268210417071, "loss": 0.0112, "step": 115040 }, { "epoch": 1.24, "learning_rate": 0.0001134364662385678, "loss": 0.01, "step": 115050 }, { "epoch": 1.24, "learning_rate": 0.0001134202503729649, "loss": 0.0122, "step": 115060 }, { "epoch": 1.24, "learning_rate": 0.00011340403450736199, "loss": 0.011, "step": 115070 }, { "epoch": 1.24, "learning_rate": 0.00011338781864175908, "loss": 0.0073, "step": 115080 }, { "epoch": 1.24, "learning_rate": 0.00011337160277615619, "loss": 0.0094, "step": 115090 }, { "epoch": 1.24, "learning_rate": 0.00011335538691055328, "loss": 0.0099, "step": 115100 }, { "epoch": 1.24, "learning_rate": 0.00011333917104495037, "loss": 0.0102, "step": 115110 }, { "epoch": 1.24, "learning_rate": 0.00011332295517934747, "loss": 0.0082, "step": 115120 }, { "epoch": 1.24, "learning_rate": 0.00011330673931374457, "loss": 0.0082, "step": 115130 }, { "epoch": 1.24, "learning_rate": 0.00011329052344814165, "loss": 0.0084, "step": 115140 }, { "epoch": 1.24, "learning_rate": 0.00011327430758253876, "loss": 0.0092, "step": 115150 }, { "epoch": 1.24, "learning_rate": 0.00011325809171693584, "loss": 0.0094, "step": 115160 }, { "epoch": 1.25, "learning_rate": 0.00011324187585133294, "loss": 0.0106, "step": 115170 }, { "epoch": 1.25, "learning_rate": 0.00011322565998573002, "loss": 0.0111, "step": 115180 }, { "epoch": 1.25, "learning_rate": 0.00011320944412012713, "loss": 0.0099, "step": 115190 }, { "epoch": 1.25, "learning_rate": 0.00011319322825452422, "loss": 0.0079, "step": 115200 }, { "epoch": 1.25, "learning_rate": 0.00011317701238892131, "loss": 0.0104, "step": 115210 }, { "epoch": 1.25, "learning_rate": 0.0001131607965233184, "loss": 0.0081, "step": 115220 }, { "epoch": 1.25, "learning_rate": 0.0001131445806577155, "loss": 0.0129, "step": 115230 }, { "epoch": 1.25, "learning_rate": 0.00011312836479211259, "loss": 0.0073, "step": 115240 }, { "epoch": 1.25, "learning_rate": 0.0001131121489265097, "loss": 0.01, "step": 115250 }, { "epoch": 1.25, "learning_rate": 0.00011309593306090678, "loss": 0.0116, "step": 115260 }, { "epoch": 1.25, "learning_rate": 0.00011307971719530388, "loss": 0.0106, "step": 115270 }, { "epoch": 1.25, "learning_rate": 0.00011306350132970096, "loss": 0.0076, "step": 115280 }, { "epoch": 1.25, "learning_rate": 0.00011304728546409807, "loss": 0.0101, "step": 115290 }, { "epoch": 1.25, "learning_rate": 0.00011303106959849515, "loss": 0.0104, "step": 115300 }, { "epoch": 1.25, "learning_rate": 0.00011301485373289225, "loss": 0.0107, "step": 115310 }, { "epoch": 1.25, "learning_rate": 0.00011299863786728935, "loss": 0.0089, "step": 115320 }, { "epoch": 1.25, "learning_rate": 0.00011298242200168644, "loss": 0.0085, "step": 115330 }, { "epoch": 1.25, "learning_rate": 0.00011296620613608353, "loss": 0.0085, "step": 115340 }, { "epoch": 1.25, "learning_rate": 0.00011294999027048064, "loss": 0.008, "step": 115350 }, { "epoch": 1.25, "learning_rate": 0.00011293377440487772, "loss": 0.009, "step": 115360 }, { "epoch": 1.25, "learning_rate": 0.00011291755853927482, "loss": 0.0108, "step": 115370 }, { "epoch": 1.25, "learning_rate": 0.0001129013426736719, "loss": 0.0128, "step": 115380 }, { "epoch": 1.25, "learning_rate": 0.00011288512680806901, "loss": 0.01, "step": 115390 }, { "epoch": 1.25, "learning_rate": 0.00011286891094246609, "loss": 0.0082, "step": 115400 }, { "epoch": 1.25, "learning_rate": 0.0001128526950768632, "loss": 0.0097, "step": 115410 }, { "epoch": 1.25, "learning_rate": 0.00011283647921126029, "loss": 0.0098, "step": 115420 }, { "epoch": 1.25, "learning_rate": 0.00011282026334565738, "loss": 0.0097, "step": 115430 }, { "epoch": 1.25, "learning_rate": 0.00011280404748005447, "loss": 0.0085, "step": 115440 }, { "epoch": 1.25, "learning_rate": 0.00011278783161445158, "loss": 0.0095, "step": 115450 }, { "epoch": 1.25, "learning_rate": 0.00011277161574884866, "loss": 0.0119, "step": 115460 }, { "epoch": 1.25, "learning_rate": 0.00011275539988324577, "loss": 0.0102, "step": 115470 }, { "epoch": 1.25, "learning_rate": 0.00011273918401764285, "loss": 0.009, "step": 115480 }, { "epoch": 1.25, "learning_rate": 0.00011272296815203995, "loss": 0.0096, "step": 115490 }, { "epoch": 1.25, "learning_rate": 0.00011270675228643703, "loss": 0.0083, "step": 115500 }, { "epoch": 1.25, "learning_rate": 0.00011269053642083414, "loss": 0.0097, "step": 115510 }, { "epoch": 1.25, "learning_rate": 0.00011267432055523123, "loss": 0.0109, "step": 115520 }, { "epoch": 1.25, "learning_rate": 0.00011265810468962832, "loss": 0.0098, "step": 115530 }, { "epoch": 1.25, "learning_rate": 0.00011264188882402542, "loss": 0.0084, "step": 115540 }, { "epoch": 1.25, "learning_rate": 0.00011262567295842251, "loss": 0.0104, "step": 115550 }, { "epoch": 1.25, "learning_rate": 0.0001126094570928196, "loss": 0.0121, "step": 115560 }, { "epoch": 1.25, "learning_rate": 0.00011259324122721671, "loss": 0.012, "step": 115570 }, { "epoch": 1.25, "learning_rate": 0.00011257702536161379, "loss": 0.0085, "step": 115580 }, { "epoch": 1.25, "learning_rate": 0.00011256080949601089, "loss": 0.0089, "step": 115590 }, { "epoch": 1.25, "learning_rate": 0.00011254459363040797, "loss": 0.0091, "step": 115600 }, { "epoch": 1.25, "learning_rate": 0.00011252837776480508, "loss": 0.0077, "step": 115610 }, { "epoch": 1.25, "learning_rate": 0.00011251216189920216, "loss": 0.0103, "step": 115620 }, { "epoch": 1.25, "learning_rate": 0.00011249594603359926, "loss": 0.0111, "step": 115630 }, { "epoch": 1.25, "learning_rate": 0.00011247973016799636, "loss": 0.0095, "step": 115640 }, { "epoch": 1.25, "learning_rate": 0.00011246351430239345, "loss": 0.0096, "step": 115650 }, { "epoch": 1.25, "learning_rate": 0.00011244729843679054, "loss": 0.0104, "step": 115660 }, { "epoch": 1.25, "learning_rate": 0.00011243108257118765, "loss": 0.0107, "step": 115670 }, { "epoch": 1.25, "learning_rate": 0.00011241486670558473, "loss": 0.0105, "step": 115680 }, { "epoch": 1.25, "learning_rate": 0.00011239865083998183, "loss": 0.0096, "step": 115690 }, { "epoch": 1.25, "learning_rate": 0.00011238243497437891, "loss": 0.0078, "step": 115700 }, { "epoch": 1.25, "learning_rate": 0.00011236621910877602, "loss": 0.0111, "step": 115710 }, { "epoch": 1.25, "learning_rate": 0.0001123500032431731, "loss": 0.0124, "step": 115720 }, { "epoch": 1.25, "learning_rate": 0.0001123337873775702, "loss": 0.0101, "step": 115730 }, { "epoch": 1.25, "learning_rate": 0.0001123175715119673, "loss": 0.008, "step": 115740 }, { "epoch": 1.25, "learning_rate": 0.00011230135564636439, "loss": 0.0071, "step": 115750 }, { "epoch": 1.25, "learning_rate": 0.00011228513978076148, "loss": 0.0111, "step": 115760 }, { "epoch": 1.25, "learning_rate": 0.00011226892391515858, "loss": 0.0125, "step": 115770 }, { "epoch": 1.25, "learning_rate": 0.00011225270804955567, "loss": 0.01, "step": 115780 }, { "epoch": 1.25, "learning_rate": 0.00011223649218395277, "loss": 0.0092, "step": 115790 }, { "epoch": 1.25, "learning_rate": 0.00011222027631834985, "loss": 0.0103, "step": 115800 }, { "epoch": 1.25, "learning_rate": 0.00011220406045274696, "loss": 0.0084, "step": 115810 }, { "epoch": 1.25, "learning_rate": 0.00011218784458714407, "loss": 0.0112, "step": 115820 }, { "epoch": 1.25, "learning_rate": 0.00011217162872154115, "loss": 0.0081, "step": 115830 }, { "epoch": 1.25, "learning_rate": 0.00011215541285593825, "loss": 0.0087, "step": 115840 }, { "epoch": 1.25, "learning_rate": 0.00011213919699033533, "loss": 0.0099, "step": 115850 }, { "epoch": 1.25, "learning_rate": 0.00011212298112473244, "loss": 0.008, "step": 115860 }, { "epoch": 1.25, "learning_rate": 0.00011210676525912952, "loss": 0.0097, "step": 115870 }, { "epoch": 1.25, "learning_rate": 0.00011209054939352662, "loss": 0.0094, "step": 115880 }, { "epoch": 1.25, "learning_rate": 0.00011207433352792372, "loss": 0.0114, "step": 115890 }, { "epoch": 1.25, "learning_rate": 0.00011205811766232081, "loss": 0.0111, "step": 115900 }, { "epoch": 1.25, "learning_rate": 0.0001120419017967179, "loss": 0.0106, "step": 115910 }, { "epoch": 1.25, "learning_rate": 0.000112025685931115, "loss": 0.0092, "step": 115920 }, { "epoch": 1.25, "learning_rate": 0.00011200947006551209, "loss": 0.0107, "step": 115930 }, { "epoch": 1.25, "learning_rate": 0.00011199325419990919, "loss": 0.0088, "step": 115940 }, { "epoch": 1.25, "learning_rate": 0.00011197703833430627, "loss": 0.0096, "step": 115950 }, { "epoch": 1.25, "learning_rate": 0.00011196082246870338, "loss": 0.0103, "step": 115960 }, { "epoch": 1.25, "learning_rate": 0.00011194460660310046, "loss": 0.0083, "step": 115970 }, { "epoch": 1.25, "learning_rate": 0.00011192839073749756, "loss": 0.0113, "step": 115980 }, { "epoch": 1.25, "learning_rate": 0.00011191217487189466, "loss": 0.0094, "step": 115990 }, { "epoch": 1.25, "learning_rate": 0.00011189595900629175, "loss": 0.0111, "step": 116000 }, { "epoch": 1.25, "eval_cer": 0.9215382263475072, "eval_loss": 0.00765196094289422, "eval_runtime": 121.1107, "eval_samples_per_second": 16.514, "eval_steps_per_second": 4.128, "step": 116000 }, { "epoch": 1.25, "learning_rate": 0.00011187974314068884, "loss": 0.0092, "step": 116010 }, { "epoch": 1.25, "learning_rate": 0.00011186352727508593, "loss": 0.0104, "step": 116020 }, { "epoch": 1.25, "learning_rate": 0.00011184731140948303, "loss": 0.0085, "step": 116030 }, { "epoch": 1.25, "learning_rate": 0.00011183109554388013, "loss": 0.0101, "step": 116040 }, { "epoch": 1.25, "learning_rate": 0.00011181487967827721, "loss": 0.009, "step": 116050 }, { "epoch": 1.25, "learning_rate": 0.00011179866381267432, "loss": 0.0092, "step": 116060 }, { "epoch": 1.25, "learning_rate": 0.0001117824479470714, "loss": 0.0092, "step": 116070 }, { "epoch": 1.25, "learning_rate": 0.0001117662320814685, "loss": 0.0114, "step": 116080 }, { "epoch": 1.25, "learning_rate": 0.00011175001621586558, "loss": 0.0094, "step": 116090 }, { "epoch": 1.26, "learning_rate": 0.00011173380035026269, "loss": 0.0096, "step": 116100 }, { "epoch": 1.26, "learning_rate": 0.00011171758448465978, "loss": 0.0091, "step": 116110 }, { "epoch": 1.26, "learning_rate": 0.00011170136861905688, "loss": 0.0098, "step": 116120 }, { "epoch": 1.26, "learning_rate": 0.00011168515275345397, "loss": 0.01, "step": 116130 }, { "epoch": 1.26, "learning_rate": 0.00011166893688785107, "loss": 0.0069, "step": 116140 }, { "epoch": 1.26, "learning_rate": 0.00011165272102224815, "loss": 0.0082, "step": 116150 }, { "epoch": 1.26, "learning_rate": 0.00011163650515664526, "loss": 0.0092, "step": 116160 }, { "epoch": 1.26, "learning_rate": 0.00011162028929104234, "loss": 0.0091, "step": 116170 }, { "epoch": 1.26, "learning_rate": 0.00011160407342543945, "loss": 0.0083, "step": 116180 }, { "epoch": 1.26, "learning_rate": 0.00011158785755983652, "loss": 0.0075, "step": 116190 }, { "epoch": 1.26, "learning_rate": 0.00011157164169423363, "loss": 0.0113, "step": 116200 }, { "epoch": 1.26, "learning_rate": 0.00011155542582863072, "loss": 0.0114, "step": 116210 }, { "epoch": 1.26, "learning_rate": 0.00011153920996302782, "loss": 0.0087, "step": 116220 }, { "epoch": 1.26, "learning_rate": 0.00011152299409742491, "loss": 0.0082, "step": 116230 }, { "epoch": 1.26, "learning_rate": 0.000111506778231822, "loss": 0.0051, "step": 116240 }, { "epoch": 1.26, "learning_rate": 0.0001114905623662191, "loss": 0.0083, "step": 116250 }, { "epoch": 1.26, "learning_rate": 0.0001114743465006162, "loss": 0.0089, "step": 116260 }, { "epoch": 1.26, "learning_rate": 0.00011145813063501328, "loss": 0.0127, "step": 116270 }, { "epoch": 1.26, "learning_rate": 0.00011144191476941039, "loss": 0.0162, "step": 116280 }, { "epoch": 1.26, "learning_rate": 0.00011142569890380747, "loss": 0.0083, "step": 116290 }, { "epoch": 1.26, "learning_rate": 0.00011140948303820457, "loss": 0.0088, "step": 116300 }, { "epoch": 1.26, "learning_rate": 0.00011139326717260165, "loss": 0.0097, "step": 116310 }, { "epoch": 1.26, "learning_rate": 0.00011137705130699876, "loss": 0.0092, "step": 116320 }, { "epoch": 1.26, "learning_rate": 0.00011136083544139585, "loss": 0.0089, "step": 116330 }, { "epoch": 1.26, "learning_rate": 0.00011134461957579294, "loss": 0.0086, "step": 116340 }, { "epoch": 1.26, "learning_rate": 0.00011132840371019004, "loss": 0.0099, "step": 116350 }, { "epoch": 1.26, "learning_rate": 0.00011131218784458714, "loss": 0.0089, "step": 116360 }, { "epoch": 1.26, "learning_rate": 0.00011129597197898422, "loss": 0.0073, "step": 116370 }, { "epoch": 1.26, "learning_rate": 0.00011127975611338133, "loss": 0.0086, "step": 116380 }, { "epoch": 1.26, "learning_rate": 0.0001112635402477784, "loss": 0.0105, "step": 116390 }, { "epoch": 1.26, "learning_rate": 0.00011124732438217551, "loss": 0.0105, "step": 116400 }, { "epoch": 1.26, "learning_rate": 0.00011123110851657259, "loss": 0.0074, "step": 116410 }, { "epoch": 1.26, "learning_rate": 0.0001112148926509697, "loss": 0.0075, "step": 116420 }, { "epoch": 1.26, "learning_rate": 0.00011119867678536679, "loss": 0.0106, "step": 116430 }, { "epoch": 1.26, "learning_rate": 0.00011118246091976388, "loss": 0.0088, "step": 116440 }, { "epoch": 1.26, "learning_rate": 0.00011116624505416098, "loss": 0.0104, "step": 116450 }, { "epoch": 1.26, "learning_rate": 0.00011115002918855808, "loss": 0.0088, "step": 116460 }, { "epoch": 1.26, "learning_rate": 0.00011113381332295516, "loss": 0.0074, "step": 116470 }, { "epoch": 1.26, "learning_rate": 0.00011111759745735227, "loss": 0.0092, "step": 116480 }, { "epoch": 1.26, "learning_rate": 0.00011110138159174935, "loss": 0.0076, "step": 116490 }, { "epoch": 1.26, "learning_rate": 0.00011108516572614645, "loss": 0.0106, "step": 116500 }, { "epoch": 1.26, "learning_rate": 0.00011106894986054353, "loss": 0.0086, "step": 116510 }, { "epoch": 1.26, "learning_rate": 0.00011105273399494064, "loss": 0.0078, "step": 116520 }, { "epoch": 1.26, "learning_rate": 0.00011103651812933775, "loss": 0.0101, "step": 116530 }, { "epoch": 1.26, "learning_rate": 0.00011102030226373482, "loss": 0.0098, "step": 116540 }, { "epoch": 1.26, "learning_rate": 0.00011100408639813193, "loss": 0.0106, "step": 116550 }, { "epoch": 1.26, "learning_rate": 0.00011098787053252901, "loss": 0.0086, "step": 116560 }, { "epoch": 1.26, "learning_rate": 0.00011097165466692612, "loss": 0.0113, "step": 116570 }, { "epoch": 1.26, "learning_rate": 0.00011095543880132321, "loss": 0.009, "step": 116580 }, { "epoch": 1.26, "learning_rate": 0.0001109392229357203, "loss": 0.009, "step": 116590 }, { "epoch": 1.26, "learning_rate": 0.0001109230070701174, "loss": 0.0117, "step": 116600 }, { "epoch": 1.26, "learning_rate": 0.0001109067912045145, "loss": 0.0112, "step": 116610 }, { "epoch": 1.26, "learning_rate": 0.00011089057533891158, "loss": 0.0087, "step": 116620 }, { "epoch": 1.26, "learning_rate": 0.00011087435947330869, "loss": 0.009, "step": 116630 }, { "epoch": 1.26, "learning_rate": 0.00011085814360770577, "loss": 0.012, "step": 116640 }, { "epoch": 1.26, "learning_rate": 0.00011084192774210287, "loss": 0.0082, "step": 116650 }, { "epoch": 1.26, "learning_rate": 0.00011082571187649995, "loss": 0.0088, "step": 116660 }, { "epoch": 1.26, "learning_rate": 0.00011080949601089706, "loss": 0.0088, "step": 116670 }, { "epoch": 1.26, "learning_rate": 0.00011079328014529415, "loss": 0.0077, "step": 116680 }, { "epoch": 1.26, "learning_rate": 0.00011077706427969124, "loss": 0.0081, "step": 116690 }, { "epoch": 1.26, "learning_rate": 0.00011076084841408834, "loss": 0.0102, "step": 116700 }, { "epoch": 1.26, "learning_rate": 0.00011074463254848543, "loss": 0.0097, "step": 116710 }, { "epoch": 1.26, "learning_rate": 0.00011072841668288252, "loss": 0.0108, "step": 116720 }, { "epoch": 1.26, "learning_rate": 0.00011071220081727963, "loss": 0.0119, "step": 116730 }, { "epoch": 1.26, "learning_rate": 0.00011069598495167671, "loss": 0.0154, "step": 116740 }, { "epoch": 1.26, "learning_rate": 0.00011067976908607381, "loss": 0.0102, "step": 116750 }, { "epoch": 1.26, "learning_rate": 0.00011066355322047089, "loss": 0.0105, "step": 116760 }, { "epoch": 1.26, "learning_rate": 0.000110647337354868, "loss": 0.0095, "step": 116770 }, { "epoch": 1.26, "learning_rate": 0.00011063112148926508, "loss": 0.0082, "step": 116780 }, { "epoch": 1.26, "learning_rate": 0.00011061490562366218, "loss": 0.0094, "step": 116790 }, { "epoch": 1.26, "learning_rate": 0.00011059868975805928, "loss": 0.0123, "step": 116800 }, { "epoch": 1.26, "learning_rate": 0.00011058247389245637, "loss": 0.0088, "step": 116810 }, { "epoch": 1.26, "learning_rate": 0.00011056625802685346, "loss": 0.0107, "step": 116820 }, { "epoch": 1.26, "learning_rate": 0.00011055004216125057, "loss": 0.0121, "step": 116830 }, { "epoch": 1.26, "learning_rate": 0.00011053382629564765, "loss": 0.0101, "step": 116840 }, { "epoch": 1.26, "learning_rate": 0.00011051761043004475, "loss": 0.0083, "step": 116850 }, { "epoch": 1.26, "learning_rate": 0.00011050139456444183, "loss": 0.0095, "step": 116860 }, { "epoch": 1.26, "learning_rate": 0.00011048517869883894, "loss": 0.0097, "step": 116870 }, { "epoch": 1.26, "learning_rate": 0.00011046896283323602, "loss": 0.0093, "step": 116880 }, { "epoch": 1.26, "learning_rate": 0.00011045274696763313, "loss": 0.0127, "step": 116890 }, { "epoch": 1.26, "learning_rate": 0.00011043653110203022, "loss": 0.0114, "step": 116900 }, { "epoch": 1.26, "learning_rate": 0.00011042031523642731, "loss": 0.008, "step": 116910 }, { "epoch": 1.26, "learning_rate": 0.0001104040993708244, "loss": 0.0097, "step": 116920 }, { "epoch": 1.26, "learning_rate": 0.0001103878835052215, "loss": 0.0082, "step": 116930 }, { "epoch": 1.26, "learning_rate": 0.00011037166763961859, "loss": 0.0082, "step": 116940 }, { "epoch": 1.26, "learning_rate": 0.0001103554517740157, "loss": 0.0101, "step": 116950 }, { "epoch": 1.26, "learning_rate": 0.00011033923590841277, "loss": 0.0092, "step": 116960 }, { "epoch": 1.26, "learning_rate": 0.00011032302004280988, "loss": 0.0094, "step": 116970 }, { "epoch": 1.26, "learning_rate": 0.00011030680417720696, "loss": 0.0067, "step": 116980 }, { "epoch": 1.26, "learning_rate": 0.00011029058831160407, "loss": 0.0111, "step": 116990 }, { "epoch": 1.26, "learning_rate": 0.00011027437244600116, "loss": 0.0118, "step": 117000 }, { "epoch": 1.26, "eval_cer": 0.9215373577445508, "eval_loss": 0.007613795343786478, "eval_runtime": 121.1129, "eval_samples_per_second": 16.514, "eval_steps_per_second": 4.128, "step": 117000 }, { "epoch": 1.26, "learning_rate": 0.00011025815658039825, "loss": 0.0091, "step": 117010 }, { "epoch": 1.27, "learning_rate": 0.00011024194071479534, "loss": 0.011, "step": 117020 }, { "epoch": 1.27, "learning_rate": 0.00011022572484919244, "loss": 0.0087, "step": 117030 }, { "epoch": 1.27, "learning_rate": 0.00011020950898358953, "loss": 0.013, "step": 117040 }, { "epoch": 1.27, "learning_rate": 0.00011019329311798664, "loss": 0.0075, "step": 117050 }, { "epoch": 1.27, "learning_rate": 0.00011017707725238372, "loss": 0.0093, "step": 117060 }, { "epoch": 1.27, "learning_rate": 0.00011016086138678082, "loss": 0.0104, "step": 117070 }, { "epoch": 1.27, "learning_rate": 0.0001101446455211779, "loss": 0.01, "step": 117080 }, { "epoch": 1.27, "learning_rate": 0.00011012842965557501, "loss": 0.0089, "step": 117090 }, { "epoch": 1.27, "learning_rate": 0.00011011221378997209, "loss": 0.0076, "step": 117100 }, { "epoch": 1.27, "learning_rate": 0.00011009599792436919, "loss": 0.0108, "step": 117110 }, { "epoch": 1.27, "learning_rate": 0.00011007978205876629, "loss": 0.0106, "step": 117120 }, { "epoch": 1.27, "learning_rate": 0.00011006356619316338, "loss": 0.0096, "step": 117130 }, { "epoch": 1.27, "learning_rate": 0.00011004735032756047, "loss": 0.0093, "step": 117140 }, { "epoch": 1.27, "learning_rate": 0.00011003113446195758, "loss": 0.0078, "step": 117150 }, { "epoch": 1.27, "learning_rate": 0.00011001491859635466, "loss": 0.0074, "step": 117160 }, { "epoch": 1.27, "learning_rate": 0.00010999870273075176, "loss": 0.0096, "step": 117170 }, { "epoch": 1.27, "learning_rate": 0.00010998248686514884, "loss": 0.008, "step": 117180 }, { "epoch": 1.27, "learning_rate": 0.00010996627099954595, "loss": 0.011, "step": 117190 }, { "epoch": 1.27, "learning_rate": 0.00010995005513394303, "loss": 0.0093, "step": 117200 }, { "epoch": 1.27, "learning_rate": 0.00010993383926834013, "loss": 0.009, "step": 117210 }, { "epoch": 1.27, "learning_rate": 0.00010991762340273723, "loss": 0.0091, "step": 117220 }, { "epoch": 1.27, "learning_rate": 0.00010990140753713432, "loss": 0.0082, "step": 117230 }, { "epoch": 1.27, "learning_rate": 0.00010988519167153141, "loss": 0.0081, "step": 117240 }, { "epoch": 1.27, "learning_rate": 0.0001098689758059285, "loss": 0.0082, "step": 117250 }, { "epoch": 1.27, "learning_rate": 0.00010985275994032561, "loss": 0.0101, "step": 117260 }, { "epoch": 1.27, "learning_rate": 0.0001098365440747227, "loss": 0.0106, "step": 117270 }, { "epoch": 1.27, "learning_rate": 0.0001098203282091198, "loss": 0.0103, "step": 117280 }, { "epoch": 1.27, "learning_rate": 0.00010980411234351689, "loss": 0.0096, "step": 117290 }, { "epoch": 1.27, "learning_rate": 0.000109787896477914, "loss": 0.0102, "step": 117300 }, { "epoch": 1.27, "learning_rate": 0.00010977168061231107, "loss": 0.009, "step": 117310 }, { "epoch": 1.27, "learning_rate": 0.00010975546474670818, "loss": 0.0111, "step": 117320 }, { "epoch": 1.27, "learning_rate": 0.00010973924888110526, "loss": 0.0104, "step": 117330 }, { "epoch": 1.27, "learning_rate": 0.00010972303301550237, "loss": 0.0082, "step": 117340 }, { "epoch": 1.27, "learning_rate": 0.00010970681714989945, "loss": 0.01, "step": 117350 }, { "epoch": 1.27, "learning_rate": 0.00010969060128429655, "loss": 0.0094, "step": 117360 }, { "epoch": 1.27, "learning_rate": 0.00010967438541869364, "loss": 0.01, "step": 117370 }, { "epoch": 1.27, "learning_rate": 0.00010965816955309074, "loss": 0.0105, "step": 117380 }, { "epoch": 1.27, "learning_rate": 0.00010964195368748783, "loss": 0.009, "step": 117390 }, { "epoch": 1.27, "learning_rate": 0.00010962573782188492, "loss": 0.0094, "step": 117400 }, { "epoch": 1.27, "learning_rate": 0.00010960952195628202, "loss": 0.0087, "step": 117410 }, { "epoch": 1.27, "learning_rate": 0.00010959330609067912, "loss": 0.0096, "step": 117420 }, { "epoch": 1.27, "learning_rate": 0.0001095770902250762, "loss": 0.0105, "step": 117430 }, { "epoch": 1.27, "learning_rate": 0.00010956087435947331, "loss": 0.0082, "step": 117440 }, { "epoch": 1.27, "learning_rate": 0.00010954465849387039, "loss": 0.01, "step": 117450 }, { "epoch": 1.27, "learning_rate": 0.00010952844262826749, "loss": 0.0099, "step": 117460 }, { "epoch": 1.27, "learning_rate": 0.00010951222676266459, "loss": 0.0094, "step": 117470 }, { "epoch": 1.27, "learning_rate": 0.00010949601089706168, "loss": 0.0092, "step": 117480 }, { "epoch": 1.27, "learning_rate": 0.00010947979503145877, "loss": 0.0111, "step": 117490 }, { "epoch": 1.27, "learning_rate": 0.00010946357916585586, "loss": 0.009, "step": 117500 }, { "epoch": 1.27, "learning_rate": 0.00010944736330025296, "loss": 0.0123, "step": 117510 }, { "epoch": 1.27, "learning_rate": 0.00010943114743465006, "loss": 0.0107, "step": 117520 }, { "epoch": 1.27, "learning_rate": 0.00010941493156904714, "loss": 0.0081, "step": 117530 }, { "epoch": 1.27, "learning_rate": 0.00010939871570344425, "loss": 0.0098, "step": 117540 }, { "epoch": 1.27, "learning_rate": 0.00010938249983784133, "loss": 0.0085, "step": 117550 }, { "epoch": 1.27, "learning_rate": 0.00010936628397223843, "loss": 0.0098, "step": 117560 }, { "epoch": 1.27, "learning_rate": 0.00010935006810663551, "loss": 0.012, "step": 117570 }, { "epoch": 1.27, "learning_rate": 0.00010933385224103262, "loss": 0.0085, "step": 117580 }, { "epoch": 1.27, "learning_rate": 0.00010931763637542971, "loss": 0.0085, "step": 117590 }, { "epoch": 1.27, "learning_rate": 0.0001093014205098268, "loss": 0.0102, "step": 117600 }, { "epoch": 1.27, "learning_rate": 0.0001092852046442239, "loss": 0.009, "step": 117610 }, { "epoch": 1.27, "learning_rate": 0.000109268988778621, "loss": 0.0099, "step": 117620 }, { "epoch": 1.27, "learning_rate": 0.00010925277291301808, "loss": 0.0082, "step": 117630 }, { "epoch": 1.27, "learning_rate": 0.00010923655704741519, "loss": 0.0104, "step": 117640 }, { "epoch": 1.27, "learning_rate": 0.00010922034118181227, "loss": 0.0119, "step": 117650 }, { "epoch": 1.27, "learning_rate": 0.00010920412531620937, "loss": 0.008, "step": 117660 }, { "epoch": 1.27, "learning_rate": 0.00010918790945060645, "loss": 0.01, "step": 117670 }, { "epoch": 1.27, "learning_rate": 0.00010917169358500356, "loss": 0.0117, "step": 117680 }, { "epoch": 1.27, "learning_rate": 0.00010915547771940065, "loss": 0.0104, "step": 117690 }, { "epoch": 1.27, "learning_rate": 0.00010913926185379775, "loss": 0.0107, "step": 117700 }, { "epoch": 1.27, "learning_rate": 0.00010912304598819484, "loss": 0.0105, "step": 117710 }, { "epoch": 1.27, "learning_rate": 0.00010910683012259193, "loss": 0.0095, "step": 117720 }, { "epoch": 1.27, "learning_rate": 0.00010909061425698902, "loss": 0.0098, "step": 117730 }, { "epoch": 1.27, "learning_rate": 0.00010907439839138613, "loss": 0.0085, "step": 117740 }, { "epoch": 1.27, "learning_rate": 0.00010905818252578321, "loss": 0.0078, "step": 117750 }, { "epoch": 1.27, "learning_rate": 0.00010904196666018032, "loss": 0.0104, "step": 117760 }, { "epoch": 1.27, "learning_rate": 0.0001090257507945774, "loss": 0.0106, "step": 117770 }, { "epoch": 1.27, "learning_rate": 0.0001090095349289745, "loss": 0.0074, "step": 117780 }, { "epoch": 1.27, "learning_rate": 0.00010899331906337158, "loss": 0.0088, "step": 117790 }, { "epoch": 1.27, "learning_rate": 0.00010897710319776869, "loss": 0.0101, "step": 117800 }, { "epoch": 1.27, "learning_rate": 0.00010896088733216578, "loss": 0.0075, "step": 117810 }, { "epoch": 1.27, "learning_rate": 0.00010894467146656287, "loss": 0.0095, "step": 117820 }, { "epoch": 1.27, "learning_rate": 0.00010892845560095997, "loss": 0.0083, "step": 117830 }, { "epoch": 1.27, "learning_rate": 0.00010891223973535707, "loss": 0.0099, "step": 117840 }, { "epoch": 1.27, "learning_rate": 0.00010889602386975415, "loss": 0.0109, "step": 117850 }, { "epoch": 1.27, "learning_rate": 0.00010887980800415126, "loss": 0.0093, "step": 117860 }, { "epoch": 1.27, "learning_rate": 0.00010886359213854834, "loss": 0.0079, "step": 117870 }, { "epoch": 1.27, "learning_rate": 0.00010884737627294544, "loss": 0.0102, "step": 117880 }, { "epoch": 1.27, "learning_rate": 0.00010883116040734252, "loss": 0.0099, "step": 117890 }, { "epoch": 1.27, "learning_rate": 0.00010881494454173963, "loss": 0.0088, "step": 117900 }, { "epoch": 1.27, "learning_rate": 0.00010879872867613672, "loss": 0.0072, "step": 117910 }, { "epoch": 1.27, "learning_rate": 0.00010878251281053381, "loss": 0.0083, "step": 117920 }, { "epoch": 1.27, "learning_rate": 0.0001087662969449309, "loss": 0.0091, "step": 117930 }, { "epoch": 1.27, "learning_rate": 0.000108750081079328, "loss": 0.0096, "step": 117940 }, { "epoch": 1.28, "learning_rate": 0.00010873386521372509, "loss": 0.0102, "step": 117950 }, { "epoch": 1.28, "learning_rate": 0.0001087176493481222, "loss": 0.0085, "step": 117960 }, { "epoch": 1.28, "learning_rate": 0.00010870143348251929, "loss": 0.0069, "step": 117970 }, { "epoch": 1.28, "learning_rate": 0.00010868521761691638, "loss": 0.0096, "step": 117980 }, { "epoch": 1.28, "learning_rate": 0.00010866900175131349, "loss": 0.0092, "step": 117990 }, { "epoch": 1.28, "learning_rate": 0.00010865278588571057, "loss": 0.0088, "step": 118000 }, { "epoch": 1.28, "eval_cer": 0.9215364891415945, "eval_loss": 0.00760659808292985, "eval_runtime": 121.2431, "eval_samples_per_second": 16.496, "eval_steps_per_second": 4.124, "step": 118000 }, { "epoch": 1.28, "learning_rate": 0.00010863657002010768, "loss": 0.0099, "step": 118010 }, { "epoch": 1.28, "learning_rate": 0.00010862035415450475, "loss": 0.0088, "step": 118020 }, { "epoch": 1.28, "learning_rate": 0.00010860413828890186, "loss": 0.0089, "step": 118030 }, { "epoch": 1.28, "learning_rate": 0.00010858792242329894, "loss": 0.0087, "step": 118040 }, { "epoch": 1.28, "learning_rate": 0.00010857170655769605, "loss": 0.0098, "step": 118050 }, { "epoch": 1.28, "learning_rate": 0.00010855549069209314, "loss": 0.0089, "step": 118060 }, { "epoch": 1.28, "learning_rate": 0.00010853927482649023, "loss": 0.0102, "step": 118070 }, { "epoch": 1.28, "learning_rate": 0.00010852305896088732, "loss": 0.0084, "step": 118080 }, { "epoch": 1.28, "learning_rate": 0.00010850684309528442, "loss": 0.0087, "step": 118090 }, { "epoch": 1.28, "learning_rate": 0.00010849062722968151, "loss": 0.0092, "step": 118100 }, { "epoch": 1.28, "learning_rate": 0.00010847441136407862, "loss": 0.0097, "step": 118110 }, { "epoch": 1.28, "learning_rate": 0.0001084581954984757, "loss": 0.0103, "step": 118120 }, { "epoch": 1.28, "learning_rate": 0.0001084419796328728, "loss": 0.0093, "step": 118130 }, { "epoch": 1.28, "learning_rate": 0.00010842576376726988, "loss": 0.0092, "step": 118140 }, { "epoch": 1.28, "learning_rate": 0.00010840954790166699, "loss": 0.0089, "step": 118150 }, { "epoch": 1.28, "learning_rate": 0.00010839333203606408, "loss": 0.0073, "step": 118160 }, { "epoch": 1.28, "learning_rate": 0.00010837711617046117, "loss": 0.0093, "step": 118170 }, { "epoch": 1.28, "learning_rate": 0.00010836090030485827, "loss": 0.0088, "step": 118180 }, { "epoch": 1.28, "learning_rate": 0.00010834468443925536, "loss": 0.0109, "step": 118190 }, { "epoch": 1.28, "learning_rate": 0.00010832846857365245, "loss": 0.0083, "step": 118200 }, { "epoch": 1.28, "learning_rate": 0.00010831225270804956, "loss": 0.0083, "step": 118210 }, { "epoch": 1.28, "learning_rate": 0.00010829603684244664, "loss": 0.0083, "step": 118220 }, { "epoch": 1.28, "learning_rate": 0.00010827982097684374, "loss": 0.009, "step": 118230 }, { "epoch": 1.28, "learning_rate": 0.00010826360511124082, "loss": 0.0089, "step": 118240 }, { "epoch": 1.28, "learning_rate": 0.00010824738924563793, "loss": 0.0092, "step": 118250 }, { "epoch": 1.28, "learning_rate": 0.00010823117338003501, "loss": 0.0079, "step": 118260 }, { "epoch": 1.28, "learning_rate": 0.00010821495751443211, "loss": 0.0105, "step": 118270 }, { "epoch": 1.28, "learning_rate": 0.0001081987416488292, "loss": 0.0091, "step": 118280 }, { "epoch": 1.28, "learning_rate": 0.0001081825257832263, "loss": 0.0081, "step": 118290 }, { "epoch": 1.28, "learning_rate": 0.00010816630991762339, "loss": 0.0071, "step": 118300 }, { "epoch": 1.28, "learning_rate": 0.0001081500940520205, "loss": 0.0087, "step": 118310 }, { "epoch": 1.28, "learning_rate": 0.00010813387818641758, "loss": 0.0104, "step": 118320 }, { "epoch": 1.28, "learning_rate": 0.00010811766232081468, "loss": 0.0075, "step": 118330 }, { "epoch": 1.28, "learning_rate": 0.00010810144645521176, "loss": 0.0082, "step": 118340 }, { "epoch": 1.28, "learning_rate": 0.00010808523058960887, "loss": 0.0089, "step": 118350 }, { "epoch": 1.28, "learning_rate": 0.00010806901472400595, "loss": 0.0095, "step": 118360 }, { "epoch": 1.28, "learning_rate": 0.00010805279885840305, "loss": 0.0088, "step": 118370 }, { "epoch": 1.28, "learning_rate": 0.00010803658299280015, "loss": 0.009, "step": 118380 }, { "epoch": 1.28, "learning_rate": 0.00010802036712719724, "loss": 0.0095, "step": 118390 }, { "epoch": 1.28, "learning_rate": 0.00010800415126159433, "loss": 0.0077, "step": 118400 }, { "epoch": 1.28, "learning_rate": 0.00010798793539599143, "loss": 0.0087, "step": 118410 }, { "epoch": 1.28, "learning_rate": 0.00010797171953038852, "loss": 0.0088, "step": 118420 }, { "epoch": 1.28, "learning_rate": 0.00010795550366478562, "loss": 0.0076, "step": 118430 }, { "epoch": 1.28, "learning_rate": 0.0001079392877991827, "loss": 0.0096, "step": 118440 }, { "epoch": 1.28, "learning_rate": 0.00010792307193357981, "loss": 0.0082, "step": 118450 }, { "epoch": 1.28, "learning_rate": 0.00010790685606797689, "loss": 0.0088, "step": 118460 }, { "epoch": 1.28, "learning_rate": 0.000107890640202374, "loss": 0.0094, "step": 118470 }, { "epoch": 1.28, "learning_rate": 0.00010787442433677107, "loss": 0.0092, "step": 118480 }, { "epoch": 1.28, "learning_rate": 0.00010785820847116818, "loss": 0.0098, "step": 118490 }, { "epoch": 1.28, "learning_rate": 0.00010784199260556527, "loss": 0.0097, "step": 118500 }, { "epoch": 1.28, "learning_rate": 0.00010782577673996237, "loss": 0.008, "step": 118510 }, { "epoch": 1.28, "learning_rate": 0.00010780956087435946, "loss": 0.0096, "step": 118520 }, { "epoch": 1.28, "learning_rate": 0.00010779334500875657, "loss": 0.0085, "step": 118530 }, { "epoch": 1.28, "learning_rate": 0.00010777712914315364, "loss": 0.0086, "step": 118540 }, { "epoch": 1.28, "learning_rate": 0.00010776091327755075, "loss": 0.008, "step": 118550 }, { "epoch": 1.28, "learning_rate": 0.00010774469741194783, "loss": 0.0107, "step": 118560 }, { "epoch": 1.28, "learning_rate": 0.00010772848154634494, "loss": 0.0082, "step": 118570 }, { "epoch": 1.28, "learning_rate": 0.00010771226568074202, "loss": 0.0096, "step": 118580 }, { "epoch": 1.28, "learning_rate": 0.00010769604981513912, "loss": 0.011, "step": 118590 }, { "epoch": 1.28, "learning_rate": 0.00010767983394953621, "loss": 0.0085, "step": 118600 }, { "epoch": 1.28, "learning_rate": 0.00010766361808393331, "loss": 0.0109, "step": 118610 }, { "epoch": 1.28, "learning_rate": 0.0001076474022183304, "loss": 0.01, "step": 118620 }, { "epoch": 1.28, "learning_rate": 0.0001076311863527275, "loss": 0.0088, "step": 118630 }, { "epoch": 1.28, "learning_rate": 0.00010761497048712459, "loss": 0.0096, "step": 118640 }, { "epoch": 1.28, "learning_rate": 0.00010759875462152169, "loss": 0.008, "step": 118650 }, { "epoch": 1.28, "learning_rate": 0.00010758253875591877, "loss": 0.0099, "step": 118660 }, { "epoch": 1.28, "learning_rate": 0.00010756632289031588, "loss": 0.0089, "step": 118670 }, { "epoch": 1.28, "learning_rate": 0.00010755010702471296, "loss": 0.0075, "step": 118680 }, { "epoch": 1.28, "learning_rate": 0.00010753389115911006, "loss": 0.0095, "step": 118690 }, { "epoch": 1.28, "learning_rate": 0.00010751767529350717, "loss": 0.0113, "step": 118700 }, { "epoch": 1.28, "learning_rate": 0.00010750145942790425, "loss": 0.0097, "step": 118710 }, { "epoch": 1.28, "learning_rate": 0.00010748524356230135, "loss": 0.0094, "step": 118720 }, { "epoch": 1.28, "learning_rate": 0.00010746902769669843, "loss": 0.009, "step": 118730 }, { "epoch": 1.28, "learning_rate": 0.00010745281183109554, "loss": 0.0097, "step": 118740 }, { "epoch": 1.28, "learning_rate": 0.00010743659596549263, "loss": 0.0074, "step": 118750 }, { "epoch": 1.28, "learning_rate": 0.00010742038009988973, "loss": 0.0078, "step": 118760 }, { "epoch": 1.28, "learning_rate": 0.00010740416423428682, "loss": 0.0112, "step": 118770 }, { "epoch": 1.28, "learning_rate": 0.00010738794836868392, "loss": 0.0105, "step": 118780 }, { "epoch": 1.28, "learning_rate": 0.000107371732503081, "loss": 0.0076, "step": 118790 }, { "epoch": 1.28, "learning_rate": 0.00010735551663747811, "loss": 0.0118, "step": 118800 }, { "epoch": 1.28, "learning_rate": 0.00010733930077187519, "loss": 0.0107, "step": 118810 }, { "epoch": 1.28, "learning_rate": 0.0001073230849062723, "loss": 0.0083, "step": 118820 }, { "epoch": 1.28, "learning_rate": 0.00010730686904066937, "loss": 0.0086, "step": 118830 }, { "epoch": 1.28, "learning_rate": 0.00010729065317506648, "loss": 0.008, "step": 118840 }, { "epoch": 1.28, "learning_rate": 0.00010727443730946357, "loss": 0.0081, "step": 118850 }, { "epoch": 1.28, "learning_rate": 0.00010725822144386067, "loss": 0.0101, "step": 118860 }, { "epoch": 1.29, "learning_rate": 0.00010724200557825776, "loss": 0.0115, "step": 118870 }, { "epoch": 1.29, "learning_rate": 0.00010722578971265485, "loss": 0.0111, "step": 118880 }, { "epoch": 1.29, "learning_rate": 0.00010720957384705194, "loss": 0.0088, "step": 118890 }, { "epoch": 1.29, "learning_rate": 0.00010719335798144905, "loss": 0.0089, "step": 118900 }, { "epoch": 1.29, "learning_rate": 0.00010717714211584613, "loss": 0.0086, "step": 118910 }, { "epoch": 1.29, "learning_rate": 0.00010716092625024324, "loss": 0.0069, "step": 118920 }, { "epoch": 1.29, "learning_rate": 0.00010714471038464032, "loss": 0.0089, "step": 118930 }, { "epoch": 1.29, "learning_rate": 0.00010712849451903742, "loss": 0.0077, "step": 118940 }, { "epoch": 1.29, "learning_rate": 0.0001071122786534345, "loss": 0.0113, "step": 118950 }, { "epoch": 1.29, "learning_rate": 0.00010709606278783161, "loss": 0.0098, "step": 118960 }, { "epoch": 1.29, "learning_rate": 0.0001070798469222287, "loss": 0.01, "step": 118970 }, { "epoch": 1.29, "learning_rate": 0.00010706363105662579, "loss": 0.0109, "step": 118980 }, { "epoch": 1.29, "learning_rate": 0.00010704741519102289, "loss": 0.0088, "step": 118990 }, { "epoch": 1.29, "learning_rate": 0.00010703119932541999, "loss": 0.01, "step": 119000 }, { "epoch": 1.29, "eval_cer": 0.9215321461268126, "eval_loss": 0.007560289464890957, "eval_runtime": 121.1493, "eval_samples_per_second": 16.509, "eval_steps_per_second": 4.127, "step": 119000 }, { "epoch": 1.29, "learning_rate": 0.00010701498345981707, "loss": 0.0088, "step": 119010 }, { "epoch": 1.29, "learning_rate": 0.00010699876759421418, "loss": 0.0096, "step": 119020 }, { "epoch": 1.29, "learning_rate": 0.00010698255172861126, "loss": 0.0078, "step": 119030 }, { "epoch": 1.29, "learning_rate": 0.00010696633586300836, "loss": 0.009, "step": 119040 }, { "epoch": 1.29, "learning_rate": 0.00010695011999740544, "loss": 0.0066, "step": 119050 }, { "epoch": 1.29, "learning_rate": 0.00010693390413180255, "loss": 0.0113, "step": 119060 }, { "epoch": 1.29, "learning_rate": 0.00010691768826619964, "loss": 0.0108, "step": 119070 }, { "epoch": 1.29, "learning_rate": 0.00010690147240059673, "loss": 0.0105, "step": 119080 }, { "epoch": 1.29, "learning_rate": 0.00010688525653499383, "loss": 0.0095, "step": 119090 }, { "epoch": 1.29, "learning_rate": 0.00010686904066939092, "loss": 0.007, "step": 119100 }, { "epoch": 1.29, "learning_rate": 0.00010685282480378801, "loss": 0.0121, "step": 119110 }, { "epoch": 1.29, "learning_rate": 0.00010683660893818512, "loss": 0.009, "step": 119120 }, { "epoch": 1.29, "learning_rate": 0.0001068203930725822, "loss": 0.0088, "step": 119130 }, { "epoch": 1.29, "learning_rate": 0.0001068041772069793, "loss": 0.0105, "step": 119140 }, { "epoch": 1.29, "learning_rate": 0.00010678796134137638, "loss": 0.0138, "step": 119150 }, { "epoch": 1.29, "learning_rate": 0.00010677174547577349, "loss": 0.0078, "step": 119160 }, { "epoch": 1.29, "learning_rate": 0.00010675552961017058, "loss": 0.0094, "step": 119170 }, { "epoch": 1.29, "learning_rate": 0.00010673931374456768, "loss": 0.0101, "step": 119180 }, { "epoch": 1.29, "learning_rate": 0.00010672309787896477, "loss": 0.0094, "step": 119190 }, { "epoch": 1.29, "learning_rate": 0.00010670688201336186, "loss": 0.0094, "step": 119200 }, { "epoch": 1.29, "learning_rate": 0.00010669066614775895, "loss": 0.0103, "step": 119210 }, { "epoch": 1.29, "learning_rate": 0.00010667445028215606, "loss": 0.0092, "step": 119220 }, { "epoch": 1.29, "learning_rate": 0.00010665823441655314, "loss": 0.0085, "step": 119230 }, { "epoch": 1.29, "learning_rate": 0.00010664201855095025, "loss": 0.009, "step": 119240 }, { "epoch": 1.29, "learning_rate": 0.00010662580268534732, "loss": 0.0118, "step": 119250 }, { "epoch": 1.29, "learning_rate": 0.00010660958681974443, "loss": 0.0092, "step": 119260 }, { "epoch": 1.29, "learning_rate": 0.00010659337095414151, "loss": 0.0104, "step": 119270 }, { "epoch": 1.29, "learning_rate": 0.00010657715508853862, "loss": 0.0086, "step": 119280 }, { "epoch": 1.29, "learning_rate": 0.00010656093922293571, "loss": 0.0096, "step": 119290 }, { "epoch": 1.29, "learning_rate": 0.0001065447233573328, "loss": 0.0091, "step": 119300 }, { "epoch": 1.29, "learning_rate": 0.0001065285074917299, "loss": 0.0088, "step": 119310 }, { "epoch": 1.29, "learning_rate": 0.000106512291626127, "loss": 0.0102, "step": 119320 }, { "epoch": 1.29, "learning_rate": 0.00010649607576052408, "loss": 0.0108, "step": 119330 }, { "epoch": 1.29, "learning_rate": 0.00010647985989492119, "loss": 0.0118, "step": 119340 }, { "epoch": 1.29, "learning_rate": 0.00010646364402931827, "loss": 0.0119, "step": 119350 }, { "epoch": 1.29, "learning_rate": 0.00010644742816371537, "loss": 0.0091, "step": 119360 }, { "epoch": 1.29, "learning_rate": 0.00010643121229811245, "loss": 0.0091, "step": 119370 }, { "epoch": 1.29, "learning_rate": 0.00010641499643250956, "loss": 0.0092, "step": 119380 }, { "epoch": 1.29, "learning_rate": 0.00010639878056690665, "loss": 0.0098, "step": 119390 }, { "epoch": 1.29, "learning_rate": 0.00010638256470130374, "loss": 0.0086, "step": 119400 }, { "epoch": 1.29, "learning_rate": 0.00010636634883570085, "loss": 0.0104, "step": 119410 }, { "epoch": 1.29, "learning_rate": 0.00010635013297009793, "loss": 0.0109, "step": 119420 }, { "epoch": 1.29, "learning_rate": 0.00010633391710449503, "loss": 0.0103, "step": 119430 }, { "epoch": 1.29, "learning_rate": 0.00010631770123889213, "loss": 0.0087, "step": 119440 }, { "epoch": 1.29, "learning_rate": 0.00010630148537328922, "loss": 0.0117, "step": 119450 }, { "epoch": 1.29, "learning_rate": 0.00010628526950768631, "loss": 0.009, "step": 119460 }, { "epoch": 1.29, "learning_rate": 0.00010626905364208342, "loss": 0.0074, "step": 119470 }, { "epoch": 1.29, "learning_rate": 0.0001062528377764805, "loss": 0.0085, "step": 119480 }, { "epoch": 1.29, "learning_rate": 0.0001062366219108776, "loss": 0.0109, "step": 119490 }, { "epoch": 1.29, "learning_rate": 0.00010622040604527468, "loss": 0.0101, "step": 119500 }, { "epoch": 1.29, "learning_rate": 0.00010620419017967179, "loss": 0.0083, "step": 119510 }, { "epoch": 1.29, "learning_rate": 0.00010618797431406887, "loss": 0.0089, "step": 119520 }, { "epoch": 1.29, "learning_rate": 0.00010617175844846598, "loss": 0.0119, "step": 119530 }, { "epoch": 1.29, "learning_rate": 0.00010615554258286307, "loss": 0.0108, "step": 119540 }, { "epoch": 1.29, "learning_rate": 0.00010613932671726016, "loss": 0.0081, "step": 119550 }, { "epoch": 1.29, "learning_rate": 0.00010612311085165725, "loss": 0.0093, "step": 119560 }, { "epoch": 1.29, "learning_rate": 0.00010610689498605435, "loss": 0.0083, "step": 119570 }, { "epoch": 1.29, "learning_rate": 0.00010609067912045144, "loss": 0.0063, "step": 119580 }, { "epoch": 1.29, "learning_rate": 0.00010607446325484855, "loss": 0.009, "step": 119590 }, { "epoch": 1.29, "learning_rate": 0.00010605824738924562, "loss": 0.0125, "step": 119600 }, { "epoch": 1.29, "learning_rate": 0.00010604203152364273, "loss": 0.0083, "step": 119610 }, { "epoch": 1.29, "learning_rate": 0.00010602581565803981, "loss": 0.008, "step": 119620 }, { "epoch": 1.29, "learning_rate": 0.00010600959979243692, "loss": 0.0106, "step": 119630 }, { "epoch": 1.29, "learning_rate": 0.00010599338392683401, "loss": 0.0084, "step": 119640 }, { "epoch": 1.29, "learning_rate": 0.0001059771680612311, "loss": 0.007, "step": 119650 }, { "epoch": 1.29, "learning_rate": 0.0001059609521956282, "loss": 0.0086, "step": 119660 }, { "epoch": 1.29, "learning_rate": 0.00010594473633002529, "loss": 0.0106, "step": 119670 }, { "epoch": 1.29, "learning_rate": 0.00010592852046442238, "loss": 0.0086, "step": 119680 }, { "epoch": 1.29, "learning_rate": 0.00010591230459881949, "loss": 0.0086, "step": 119690 }, { "epoch": 1.29, "learning_rate": 0.00010589608873321657, "loss": 0.0092, "step": 119700 }, { "epoch": 1.29, "learning_rate": 0.00010587987286761367, "loss": 0.0071, "step": 119710 }, { "epoch": 1.29, "learning_rate": 0.00010586365700201075, "loss": 0.0103, "step": 119720 }, { "epoch": 1.29, "learning_rate": 0.00010584744113640786, "loss": 0.0098, "step": 119730 }, { "epoch": 1.29, "learning_rate": 0.00010583122527080494, "loss": 0.0084, "step": 119740 }, { "epoch": 1.29, "learning_rate": 0.00010581500940520204, "loss": 0.0102, "step": 119750 }, { "epoch": 1.29, "learning_rate": 0.00010579879353959914, "loss": 0.0109, "step": 119760 }, { "epoch": 1.29, "learning_rate": 0.00010578257767399623, "loss": 0.0086, "step": 119770 }, { "epoch": 1.29, "learning_rate": 0.00010576636180839332, "loss": 0.0099, "step": 119780 }, { "epoch": 1.29, "learning_rate": 0.00010575014594279043, "loss": 0.0107, "step": 119790 }, { "epoch": 1.3, "learning_rate": 0.0001057339300771875, "loss": 0.0093, "step": 119800 }, { "epoch": 1.3, "learning_rate": 0.00010571771421158461, "loss": 0.0089, "step": 119810 }, { "epoch": 1.3, "learning_rate": 0.00010570149834598169, "loss": 0.0091, "step": 119820 }, { "epoch": 1.3, "learning_rate": 0.0001056852824803788, "loss": 0.0081, "step": 119830 }, { "epoch": 1.3, "learning_rate": 0.00010566906661477588, "loss": 0.0096, "step": 119840 }, { "epoch": 1.3, "learning_rate": 0.00010565285074917298, "loss": 0.0109, "step": 119850 }, { "epoch": 1.3, "learning_rate": 0.00010563663488357008, "loss": 0.0075, "step": 119860 }, { "epoch": 1.3, "learning_rate": 0.00010562041901796717, "loss": 0.0121, "step": 119870 }, { "epoch": 1.3, "learning_rate": 0.00010560420315236426, "loss": 0.0092, "step": 119880 }, { "epoch": 1.3, "learning_rate": 0.00010558798728676135, "loss": 0.0102, "step": 119890 }, { "epoch": 1.3, "learning_rate": 0.00010557177142115845, "loss": 0.0121, "step": 119900 }, { "epoch": 1.3, "learning_rate": 0.00010555555555555555, "loss": 0.009, "step": 119910 }, { "epoch": 1.3, "learning_rate": 0.00010553933968995263, "loss": 0.0078, "step": 119920 }, { "epoch": 1.3, "learning_rate": 0.00010552312382434974, "loss": 0.0121, "step": 119930 }, { "epoch": 1.3, "learning_rate": 0.00010550690795874682, "loss": 0.0098, "step": 119940 }, { "epoch": 1.3, "learning_rate": 0.00010549069209314392, "loss": 0.0097, "step": 119950 }, { "epoch": 1.3, "learning_rate": 0.000105474476227541, "loss": 0.0117, "step": 119960 }, { "epoch": 1.3, "learning_rate": 0.00010545826036193811, "loss": 0.0067, "step": 119970 }, { "epoch": 1.3, "learning_rate": 0.0001054420444963352, "loss": 0.0085, "step": 119980 }, { "epoch": 1.3, "learning_rate": 0.0001054258286307323, "loss": 0.0082, "step": 119990 }, { "epoch": 1.3, "learning_rate": 0.00010540961276512939, "loss": 0.0102, "step": 120000 }, { "epoch": 1.3, "eval_cer": 0.921546912377071, "eval_loss": 0.007600127719342709, "eval_runtime": 121.3753, "eval_samples_per_second": 16.478, "eval_steps_per_second": 4.119, "step": 120000 }, { "epoch": 1.3, "learning_rate": 0.0001053933968995265, "loss": 0.0096, "step": 120010 }, { "epoch": 1.3, "learning_rate": 0.00010537718103392357, "loss": 0.0109, "step": 120020 }, { "epoch": 1.3, "learning_rate": 0.00010536096516832068, "loss": 0.0078, "step": 120030 }, { "epoch": 1.3, "learning_rate": 0.00010534474930271776, "loss": 0.0096, "step": 120040 }, { "epoch": 1.3, "learning_rate": 0.00010532853343711487, "loss": 0.0085, "step": 120050 }, { "epoch": 1.3, "learning_rate": 0.00010531231757151194, "loss": 0.0074, "step": 120060 }, { "epoch": 1.3, "learning_rate": 0.00010529610170590905, "loss": 0.0088, "step": 120070 }, { "epoch": 1.3, "learning_rate": 0.00010527988584030614, "loss": 0.0094, "step": 120080 }, { "epoch": 1.3, "learning_rate": 0.00010526366997470324, "loss": 0.0081, "step": 120090 }, { "epoch": 1.3, "learning_rate": 0.00010524745410910033, "loss": 0.0073, "step": 120100 }, { "epoch": 1.3, "learning_rate": 0.00010523123824349742, "loss": 0.0075, "step": 120110 }, { "epoch": 1.3, "learning_rate": 0.00010521502237789452, "loss": 0.0075, "step": 120120 }, { "epoch": 1.3, "learning_rate": 0.00010519880651229162, "loss": 0.0075, "step": 120130 }, { "epoch": 1.3, "learning_rate": 0.00010518259064668871, "loss": 0.0055, "step": 120140 }, { "epoch": 1.3, "learning_rate": 0.00010516637478108581, "loss": 0.0084, "step": 120150 }, { "epoch": 1.3, "learning_rate": 0.00010515015891548291, "loss": 0.0112, "step": 120160 }, { "epoch": 1.3, "learning_rate": 0.00010513394304987999, "loss": 0.0096, "step": 120170 }, { "epoch": 1.3, "learning_rate": 0.0001051177271842771, "loss": 0.0072, "step": 120180 }, { "epoch": 1.3, "learning_rate": 0.00010510151131867418, "loss": 0.0101, "step": 120190 }, { "epoch": 1.3, "learning_rate": 0.00010508529545307128, "loss": 0.0081, "step": 120200 }, { "epoch": 1.3, "learning_rate": 0.00010506907958746836, "loss": 0.0075, "step": 120210 }, { "epoch": 1.3, "learning_rate": 0.00010505286372186547, "loss": 0.0083, "step": 120220 }, { "epoch": 1.3, "learning_rate": 0.00010503664785626256, "loss": 0.0106, "step": 120230 }, { "epoch": 1.3, "learning_rate": 0.00010502043199065966, "loss": 0.0132, "step": 120240 }, { "epoch": 1.3, "learning_rate": 0.00010500421612505675, "loss": 0.0077, "step": 120250 }, { "epoch": 1.3, "learning_rate": 0.00010498800025945384, "loss": 0.0109, "step": 120260 }, { "epoch": 1.3, "learning_rate": 0.00010497178439385093, "loss": 0.0082, "step": 120270 }, { "epoch": 1.3, "learning_rate": 0.00010495556852824804, "loss": 0.0088, "step": 120280 }, { "epoch": 1.3, "learning_rate": 0.00010493935266264512, "loss": 0.0083, "step": 120290 }, { "epoch": 1.3, "learning_rate": 0.00010492313679704223, "loss": 0.0102, "step": 120300 }, { "epoch": 1.3, "learning_rate": 0.0001049069209314393, "loss": 0.0073, "step": 120310 }, { "epoch": 1.3, "learning_rate": 0.00010489070506583641, "loss": 0.0095, "step": 120320 }, { "epoch": 1.3, "learning_rate": 0.0001048744892002335, "loss": 0.0104, "step": 120330 }, { "epoch": 1.3, "learning_rate": 0.0001048582733346306, "loss": 0.0106, "step": 120340 }, { "epoch": 1.3, "learning_rate": 0.00010484205746902769, "loss": 0.0085, "step": 120350 }, { "epoch": 1.3, "learning_rate": 0.00010482584160342478, "loss": 0.0089, "step": 120360 }, { "epoch": 1.3, "learning_rate": 0.00010480962573782187, "loss": 0.0089, "step": 120370 }, { "epoch": 1.3, "learning_rate": 0.00010479340987221898, "loss": 0.0096, "step": 120380 }, { "epoch": 1.3, "learning_rate": 0.00010477719400661606, "loss": 0.008, "step": 120390 }, { "epoch": 1.3, "learning_rate": 0.00010476097814101317, "loss": 0.0103, "step": 120400 }, { "epoch": 1.3, "learning_rate": 0.00010474476227541025, "loss": 0.0103, "step": 120410 }, { "epoch": 1.3, "learning_rate": 0.00010472854640980735, "loss": 0.0084, "step": 120420 }, { "epoch": 1.3, "learning_rate": 0.00010471233054420443, "loss": 0.0083, "step": 120430 }, { "epoch": 1.3, "learning_rate": 0.00010469611467860154, "loss": 0.0103, "step": 120440 }, { "epoch": 1.3, "learning_rate": 0.00010467989881299863, "loss": 0.0086, "step": 120450 }, { "epoch": 1.3, "learning_rate": 0.00010466368294739572, "loss": 0.0073, "step": 120460 }, { "epoch": 1.3, "learning_rate": 0.00010464746708179282, "loss": 0.0076, "step": 120470 }, { "epoch": 1.3, "learning_rate": 0.00010463125121618992, "loss": 0.0087, "step": 120480 }, { "epoch": 1.3, "learning_rate": 0.000104615035350587, "loss": 0.0099, "step": 120490 }, { "epoch": 1.3, "learning_rate": 0.00010459881948498411, "loss": 0.0073, "step": 120500 }, { "epoch": 1.3, "learning_rate": 0.00010458260361938119, "loss": 0.0089, "step": 120510 }, { "epoch": 1.3, "learning_rate": 0.00010456638775377829, "loss": 0.0085, "step": 120520 }, { "epoch": 1.3, "learning_rate": 0.00010455017188817537, "loss": 0.01, "step": 120530 }, { "epoch": 1.3, "learning_rate": 0.00010453395602257248, "loss": 0.0098, "step": 120540 }, { "epoch": 1.3, "learning_rate": 0.00010451774015696957, "loss": 0.0093, "step": 120550 }, { "epoch": 1.3, "learning_rate": 0.00010450152429136666, "loss": 0.0093, "step": 120560 }, { "epoch": 1.3, "learning_rate": 0.00010448530842576376, "loss": 0.0104, "step": 120570 }, { "epoch": 1.3, "learning_rate": 0.00010446909256016085, "loss": 0.0071, "step": 120580 }, { "epoch": 1.3, "learning_rate": 0.00010445287669455794, "loss": 0.0087, "step": 120590 }, { "epoch": 1.3, "learning_rate": 0.00010443666082895505, "loss": 0.0102, "step": 120600 }, { "epoch": 1.3, "learning_rate": 0.00010442044496335213, "loss": 0.0083, "step": 120610 }, { "epoch": 1.3, "learning_rate": 0.00010440422909774923, "loss": 0.0077, "step": 120620 }, { "epoch": 1.3, "learning_rate": 0.00010438801323214631, "loss": 0.0083, "step": 120630 }, { "epoch": 1.3, "learning_rate": 0.00010437179736654342, "loss": 0.0093, "step": 120640 }, { "epoch": 1.3, "learning_rate": 0.00010435558150094051, "loss": 0.008, "step": 120650 }, { "epoch": 1.3, "learning_rate": 0.0001043393656353376, "loss": 0.0106, "step": 120660 }, { "epoch": 1.3, "learning_rate": 0.0001043231497697347, "loss": 0.008, "step": 120670 }, { "epoch": 1.3, "learning_rate": 0.00010430693390413179, "loss": 0.0092, "step": 120680 }, { "epoch": 1.3, "learning_rate": 0.00010429071803852888, "loss": 0.0095, "step": 120690 }, { "epoch": 1.3, "learning_rate": 0.00010427450217292599, "loss": 0.0085, "step": 120700 }, { "epoch": 1.3, "learning_rate": 0.00010425828630732307, "loss": 0.011, "step": 120710 }, { "epoch": 1.31, "learning_rate": 0.00010424207044172017, "loss": 0.0085, "step": 120720 }, { "epoch": 1.31, "learning_rate": 0.00010422585457611725, "loss": 0.01, "step": 120730 }, { "epoch": 1.31, "learning_rate": 0.00010420963871051436, "loss": 0.0092, "step": 120740 }, { "epoch": 1.31, "learning_rate": 0.00010419342284491144, "loss": 0.0077, "step": 120750 }, { "epoch": 1.31, "learning_rate": 0.00010417720697930855, "loss": 0.0085, "step": 120760 }, { "epoch": 1.31, "learning_rate": 0.00010416099111370564, "loss": 0.0086, "step": 120770 }, { "epoch": 1.31, "learning_rate": 0.00010414477524810273, "loss": 0.0071, "step": 120780 }, { "epoch": 1.31, "learning_rate": 0.00010412855938249982, "loss": 0.0078, "step": 120790 }, { "epoch": 1.31, "learning_rate": 0.00010411234351689693, "loss": 0.0079, "step": 120800 }, { "epoch": 1.31, "learning_rate": 0.00010409612765129401, "loss": 0.0098, "step": 120810 }, { "epoch": 1.31, "learning_rate": 0.00010407991178569112, "loss": 0.0085, "step": 120820 }, { "epoch": 1.31, "learning_rate": 0.0001040636959200882, "loss": 0.0107, "step": 120830 }, { "epoch": 1.31, "learning_rate": 0.0001040474800544853, "loss": 0.0089, "step": 120840 }, { "epoch": 1.31, "learning_rate": 0.00010403126418888241, "loss": 0.0096, "step": 120850 }, { "epoch": 1.31, "learning_rate": 0.00010401504832327949, "loss": 0.008, "step": 120860 }, { "epoch": 1.31, "learning_rate": 0.00010399883245767659, "loss": 0.008, "step": 120870 }, { "epoch": 1.31, "learning_rate": 0.00010398261659207367, "loss": 0.0106, "step": 120880 }, { "epoch": 1.31, "learning_rate": 0.00010396640072647078, "loss": 0.0082, "step": 120890 }, { "epoch": 1.31, "learning_rate": 0.00010395018486086786, "loss": 0.0088, "step": 120900 }, { "epoch": 1.31, "learning_rate": 0.00010393396899526496, "loss": 0.0073, "step": 120910 }, { "epoch": 1.31, "learning_rate": 0.00010391775312966206, "loss": 0.0099, "step": 120920 }, { "epoch": 1.31, "learning_rate": 0.00010390153726405915, "loss": 0.0114, "step": 120930 }, { "epoch": 1.31, "learning_rate": 0.00010388532139845624, "loss": 0.0099, "step": 120940 }, { "epoch": 1.31, "learning_rate": 0.00010386910553285335, "loss": 0.0091, "step": 120950 }, { "epoch": 1.31, "learning_rate": 0.00010385288966725043, "loss": 0.0083, "step": 120960 }, { "epoch": 1.31, "learning_rate": 0.00010383667380164753, "loss": 0.0135, "step": 120970 }, { "epoch": 1.31, "learning_rate": 0.00010382045793604461, "loss": 0.0088, "step": 120980 }, { "epoch": 1.31, "learning_rate": 0.00010380424207044172, "loss": 0.0101, "step": 120990 }, { "epoch": 1.31, "learning_rate": 0.0001037880262048388, "loss": 0.0106, "step": 121000 }, { "epoch": 1.31, "eval_cer": 0.9215330147297689, "eval_loss": 0.007609688676893711, "eval_runtime": 121.1646, "eval_samples_per_second": 16.506, "eval_steps_per_second": 4.127, "step": 121000 }, { "epoch": 1.31, "learning_rate": 0.0001037718103392359, "loss": 0.009, "step": 121010 }, { "epoch": 1.31, "learning_rate": 0.000103755594473633, "loss": 0.0085, "step": 121020 }, { "epoch": 1.31, "learning_rate": 0.00010373937860803009, "loss": 0.0074, "step": 121030 }, { "epoch": 1.31, "learning_rate": 0.00010372316274242718, "loss": 0.0067, "step": 121040 }, { "epoch": 1.31, "learning_rate": 0.00010370694687682428, "loss": 0.0101, "step": 121050 }, { "epoch": 1.31, "learning_rate": 0.00010369073101122137, "loss": 0.0088, "step": 121060 }, { "epoch": 1.31, "learning_rate": 0.00010367451514561847, "loss": 0.0095, "step": 121070 }, { "epoch": 1.31, "learning_rate": 0.00010365829928001555, "loss": 0.0093, "step": 121080 }, { "epoch": 1.31, "learning_rate": 0.00010364208341441266, "loss": 0.0091, "step": 121090 }, { "epoch": 1.31, "learning_rate": 0.00010362586754880974, "loss": 0.0101, "step": 121100 }, { "epoch": 1.31, "learning_rate": 0.00010360965168320685, "loss": 0.0113, "step": 121110 }, { "epoch": 1.31, "learning_rate": 0.00010359343581760392, "loss": 0.0085, "step": 121120 }, { "epoch": 1.31, "learning_rate": 0.00010357721995200103, "loss": 0.0081, "step": 121130 }, { "epoch": 1.31, "learning_rate": 0.00010356100408639812, "loss": 0.009, "step": 121140 }, { "epoch": 1.31, "learning_rate": 0.00010354478822079522, "loss": 0.0125, "step": 121150 }, { "epoch": 1.31, "learning_rate": 0.00010352857235519231, "loss": 0.0112, "step": 121160 }, { "epoch": 1.31, "learning_rate": 0.00010351235648958942, "loss": 0.0084, "step": 121170 }, { "epoch": 1.31, "learning_rate": 0.0001034961406239865, "loss": 0.0074, "step": 121180 }, { "epoch": 1.31, "learning_rate": 0.0001034799247583836, "loss": 0.0083, "step": 121190 }, { "epoch": 1.31, "learning_rate": 0.00010346370889278068, "loss": 0.0098, "step": 121200 }, { "epoch": 1.31, "learning_rate": 0.00010344749302717779, "loss": 0.0095, "step": 121210 }, { "epoch": 1.31, "learning_rate": 0.00010343127716157487, "loss": 0.0072, "step": 121220 }, { "epoch": 1.31, "learning_rate": 0.00010341506129597197, "loss": 0.0074, "step": 121230 }, { "epoch": 1.31, "learning_rate": 0.00010339884543036906, "loss": 0.0092, "step": 121240 }, { "epoch": 1.31, "learning_rate": 0.00010338262956476616, "loss": 0.0075, "step": 121250 }, { "epoch": 1.31, "learning_rate": 0.00010336641369916325, "loss": 0.0121, "step": 121260 }, { "epoch": 1.31, "learning_rate": 0.00010335019783356034, "loss": 0.0101, "step": 121270 }, { "epoch": 1.31, "learning_rate": 0.00010333398196795744, "loss": 0.0107, "step": 121280 }, { "epoch": 1.31, "learning_rate": 0.00010331776610235454, "loss": 0.0099, "step": 121290 }, { "epoch": 1.31, "learning_rate": 0.00010330155023675162, "loss": 0.0068, "step": 121300 }, { "epoch": 1.31, "learning_rate": 0.00010328533437114873, "loss": 0.01, "step": 121310 }, { "epoch": 1.31, "learning_rate": 0.00010326911850554581, "loss": 0.01, "step": 121320 }, { "epoch": 1.31, "learning_rate": 0.00010325290263994291, "loss": 0.011, "step": 121330 }, { "epoch": 1.31, "learning_rate": 0.00010323668677434, "loss": 0.011, "step": 121340 }, { "epoch": 1.31, "learning_rate": 0.0001032204709087371, "loss": 0.0081, "step": 121350 }, { "epoch": 1.31, "learning_rate": 0.00010320425504313419, "loss": 0.0096, "step": 121360 }, { "epoch": 1.31, "learning_rate": 0.00010318803917753128, "loss": 0.0093, "step": 121370 }, { "epoch": 1.31, "learning_rate": 0.00010317182331192838, "loss": 0.0101, "step": 121380 }, { "epoch": 1.31, "learning_rate": 0.00010315560744632548, "loss": 0.008, "step": 121390 }, { "epoch": 1.31, "learning_rate": 0.00010313939158072256, "loss": 0.0101, "step": 121400 }, { "epoch": 1.31, "learning_rate": 0.00010312317571511967, "loss": 0.009, "step": 121410 }, { "epoch": 1.31, "learning_rate": 0.00010310695984951675, "loss": 0.0088, "step": 121420 }, { "epoch": 1.31, "learning_rate": 0.00010309074398391385, "loss": 0.0103, "step": 121430 }, { "epoch": 1.31, "learning_rate": 0.00010307452811831093, "loss": 0.0089, "step": 121440 }, { "epoch": 1.31, "learning_rate": 0.00010305831225270804, "loss": 0.0078, "step": 121450 }, { "epoch": 1.31, "learning_rate": 0.00010304209638710513, "loss": 0.0082, "step": 121460 }, { "epoch": 1.31, "learning_rate": 0.00010302588052150223, "loss": 0.0119, "step": 121470 }, { "epoch": 1.31, "learning_rate": 0.00010300966465589932, "loss": 0.008, "step": 121480 }, { "epoch": 1.31, "learning_rate": 0.00010299344879029642, "loss": 0.0112, "step": 121490 }, { "epoch": 1.31, "learning_rate": 0.0001029772329246935, "loss": 0.0119, "step": 121500 }, { "epoch": 1.31, "learning_rate": 0.00010296101705909061, "loss": 0.0079, "step": 121510 }, { "epoch": 1.31, "learning_rate": 0.00010294480119348769, "loss": 0.0073, "step": 121520 }, { "epoch": 1.31, "learning_rate": 0.0001029285853278848, "loss": 0.0109, "step": 121530 }, { "epoch": 1.31, "learning_rate": 0.00010291236946228187, "loss": 0.0104, "step": 121540 }, { "epoch": 1.31, "learning_rate": 0.00010289615359667898, "loss": 0.0095, "step": 121550 }, { "epoch": 1.31, "learning_rate": 0.00010287993773107607, "loss": 0.0111, "step": 121560 }, { "epoch": 1.31, "learning_rate": 0.00010286372186547317, "loss": 0.0069, "step": 121570 }, { "epoch": 1.31, "learning_rate": 0.00010284750599987027, "loss": 0.0084, "step": 121580 }, { "epoch": 1.31, "learning_rate": 0.00010283129013426735, "loss": 0.0102, "step": 121590 }, { "epoch": 1.31, "learning_rate": 0.00010281507426866446, "loss": 0.0109, "step": 121600 }, { "epoch": 1.31, "learning_rate": 0.00010279885840306155, "loss": 0.0082, "step": 121610 }, { "epoch": 1.31, "learning_rate": 0.00010278264253745864, "loss": 0.0097, "step": 121620 }, { "epoch": 1.31, "learning_rate": 0.00010276642667185574, "loss": 0.0085, "step": 121630 }, { "epoch": 1.31, "learning_rate": 0.00010275021080625284, "loss": 0.0106, "step": 121640 }, { "epoch": 1.32, "learning_rate": 0.00010273399494064992, "loss": 0.0081, "step": 121650 }, { "epoch": 1.32, "learning_rate": 0.00010271777907504703, "loss": 0.01, "step": 121660 }, { "epoch": 1.32, "learning_rate": 0.00010270156320944411, "loss": 0.01, "step": 121670 }, { "epoch": 1.32, "learning_rate": 0.00010268534734384121, "loss": 0.0087, "step": 121680 }, { "epoch": 1.32, "learning_rate": 0.00010266913147823829, "loss": 0.0089, "step": 121690 }, { "epoch": 1.32, "learning_rate": 0.0001026529156126354, "loss": 0.0086, "step": 121700 }, { "epoch": 1.32, "learning_rate": 0.00010263669974703249, "loss": 0.0106, "step": 121710 }, { "epoch": 1.32, "learning_rate": 0.00010262048388142958, "loss": 0.0079, "step": 121720 }, { "epoch": 1.32, "learning_rate": 0.00010260426801582668, "loss": 0.0065, "step": 121730 }, { "epoch": 1.32, "learning_rate": 0.00010258805215022377, "loss": 0.0099, "step": 121740 }, { "epoch": 1.32, "learning_rate": 0.00010257183628462086, "loss": 0.0125, "step": 121750 }, { "epoch": 1.32, "learning_rate": 0.00010255562041901797, "loss": 0.0099, "step": 121760 }, { "epoch": 1.32, "learning_rate": 0.00010253940455341505, "loss": 0.0078, "step": 121770 }, { "epoch": 1.32, "learning_rate": 0.00010252318868781215, "loss": 0.0105, "step": 121780 }, { "epoch": 1.32, "learning_rate": 0.00010250697282220923, "loss": 0.0089, "step": 121790 }, { "epoch": 1.32, "learning_rate": 0.00010249075695660634, "loss": 0.0083, "step": 121800 }, { "epoch": 1.32, "learning_rate": 0.00010247454109100343, "loss": 0.0098, "step": 121810 }, { "epoch": 1.32, "learning_rate": 0.00010245832522540053, "loss": 0.0106, "step": 121820 }, { "epoch": 1.32, "learning_rate": 0.00010244210935979762, "loss": 0.0091, "step": 121830 }, { "epoch": 1.32, "learning_rate": 0.00010242589349419471, "loss": 0.0106, "step": 121840 }, { "epoch": 1.32, "learning_rate": 0.0001024096776285918, "loss": 0.0084, "step": 121850 }, { "epoch": 1.32, "learning_rate": 0.00010239346176298891, "loss": 0.0069, "step": 121860 }, { "epoch": 1.32, "learning_rate": 0.00010237724589738599, "loss": 0.0116, "step": 121870 }, { "epoch": 1.32, "learning_rate": 0.0001023610300317831, "loss": 0.0087, "step": 121880 }, { "epoch": 1.32, "learning_rate": 0.00010234481416618017, "loss": 0.0084, "step": 121890 }, { "epoch": 1.32, "learning_rate": 0.00010232859830057728, "loss": 0.0086, "step": 121900 }, { "epoch": 1.32, "learning_rate": 0.00010231238243497436, "loss": 0.009, "step": 121910 }, { "epoch": 1.32, "learning_rate": 0.00010229616656937147, "loss": 0.012, "step": 121920 }, { "epoch": 1.32, "learning_rate": 0.00010227995070376856, "loss": 0.0081, "step": 121930 }, { "epoch": 1.32, "learning_rate": 0.00010226373483816565, "loss": 0.0093, "step": 121940 }, { "epoch": 1.32, "learning_rate": 0.00010224751897256274, "loss": 0.0087, "step": 121950 }, { "epoch": 1.32, "learning_rate": 0.00010223130310695985, "loss": 0.0077, "step": 121960 }, { "epoch": 1.32, "learning_rate": 0.00010221508724135693, "loss": 0.0108, "step": 121970 }, { "epoch": 1.32, "learning_rate": 0.00010219887137575404, "loss": 0.0103, "step": 121980 }, { "epoch": 1.32, "learning_rate": 0.00010218265551015112, "loss": 0.0097, "step": 121990 }, { "epoch": 1.32, "learning_rate": 0.00010216643964454822, "loss": 0.0099, "step": 122000 }, { "epoch": 1.32, "eval_cer": 0.9215382263475072, "eval_loss": 0.007727743126451969, "eval_runtime": 121.0265, "eval_samples_per_second": 16.525, "eval_steps_per_second": 4.131, "step": 122000 }, { "epoch": 1.32, "learning_rate": 0.0001021502237789453, "loss": 0.0082, "step": 122010 }, { "epoch": 1.32, "learning_rate": 0.00010213400791334241, "loss": 0.0106, "step": 122020 }, { "epoch": 1.32, "learning_rate": 0.0001021177920477395, "loss": 0.0115, "step": 122030 }, { "epoch": 1.32, "learning_rate": 0.00010210157618213659, "loss": 0.0096, "step": 122040 }, { "epoch": 1.32, "learning_rate": 0.00010208536031653369, "loss": 0.0069, "step": 122050 }, { "epoch": 1.32, "learning_rate": 0.00010206914445093078, "loss": 0.013, "step": 122060 }, { "epoch": 1.32, "learning_rate": 0.00010205292858532787, "loss": 0.0087, "step": 122070 }, { "epoch": 1.32, "learning_rate": 0.00010203671271972498, "loss": 0.0085, "step": 122080 }, { "epoch": 1.32, "learning_rate": 0.00010202049685412206, "loss": 0.0107, "step": 122090 }, { "epoch": 1.32, "learning_rate": 0.00010200428098851916, "loss": 0.0108, "step": 122100 }, { "epoch": 1.32, "learning_rate": 0.00010198806512291624, "loss": 0.008, "step": 122110 }, { "epoch": 1.32, "learning_rate": 0.00010197184925731335, "loss": 0.0098, "step": 122120 }, { "epoch": 1.32, "learning_rate": 0.00010195563339171043, "loss": 0.0089, "step": 122130 }, { "epoch": 1.32, "learning_rate": 0.00010193941752610753, "loss": 0.0097, "step": 122140 }, { "epoch": 1.32, "learning_rate": 0.00010192320166050463, "loss": 0.0078, "step": 122150 }, { "epoch": 1.32, "learning_rate": 0.00010190698579490172, "loss": 0.0085, "step": 122160 }, { "epoch": 1.32, "learning_rate": 0.00010189076992929881, "loss": 0.009, "step": 122170 }, { "epoch": 1.32, "learning_rate": 0.00010187455406369592, "loss": 0.0086, "step": 122180 }, { "epoch": 1.32, "learning_rate": 0.000101858338198093, "loss": 0.0089, "step": 122190 }, { "epoch": 1.32, "learning_rate": 0.0001018421223324901, "loss": 0.0092, "step": 122200 }, { "epoch": 1.32, "learning_rate": 0.00010182590646688718, "loss": 0.0089, "step": 122210 }, { "epoch": 1.32, "learning_rate": 0.00010180969060128429, "loss": 0.0114, "step": 122220 }, { "epoch": 1.32, "learning_rate": 0.00010179347473568137, "loss": 0.0118, "step": 122230 }, { "epoch": 1.32, "learning_rate": 0.00010177725887007847, "loss": 0.01, "step": 122240 }, { "epoch": 1.32, "learning_rate": 0.00010176104300447557, "loss": 0.0086, "step": 122250 }, { "epoch": 1.32, "learning_rate": 0.00010174482713887266, "loss": 0.0106, "step": 122260 }, { "epoch": 1.32, "learning_rate": 0.00010172861127326975, "loss": 0.0078, "step": 122270 }, { "epoch": 1.32, "learning_rate": 0.00010171239540766685, "loss": 0.0107, "step": 122280 }, { "epoch": 1.32, "learning_rate": 0.00010169617954206395, "loss": 0.0071, "step": 122290 }, { "epoch": 1.32, "learning_rate": 0.00010167996367646104, "loss": 0.0093, "step": 122300 }, { "epoch": 1.32, "learning_rate": 0.00010166374781085814, "loss": 0.0068, "step": 122310 }, { "epoch": 1.32, "learning_rate": 0.00010164753194525523, "loss": 0.0076, "step": 122320 }, { "epoch": 1.32, "learning_rate": 0.00010163131607965234, "loss": 0.0074, "step": 122330 }, { "epoch": 1.32, "learning_rate": 0.00010161510021404942, "loss": 0.0095, "step": 122340 }, { "epoch": 1.32, "learning_rate": 0.00010159888434844652, "loss": 0.0087, "step": 122350 }, { "epoch": 1.32, "learning_rate": 0.0001015826684828436, "loss": 0.0076, "step": 122360 }, { "epoch": 1.32, "learning_rate": 0.00010156645261724071, "loss": 0.0073, "step": 122370 }, { "epoch": 1.32, "learning_rate": 0.00010155023675163779, "loss": 0.0072, "step": 122380 }, { "epoch": 1.32, "learning_rate": 0.00010153402088603489, "loss": 0.0088, "step": 122390 }, { "epoch": 1.32, "learning_rate": 0.00010151780502043199, "loss": 0.0101, "step": 122400 }, { "epoch": 1.32, "learning_rate": 0.00010150158915482908, "loss": 0.0073, "step": 122410 }, { "epoch": 1.32, "learning_rate": 0.00010148537328922617, "loss": 0.011, "step": 122420 }, { "epoch": 1.32, "learning_rate": 0.00010146915742362326, "loss": 0.0124, "step": 122430 }, { "epoch": 1.32, "learning_rate": 0.00010145294155802036, "loss": 0.0076, "step": 122440 }, { "epoch": 1.32, "learning_rate": 0.00010143672569241746, "loss": 0.0101, "step": 122450 }, { "epoch": 1.32, "learning_rate": 0.00010142050982681454, "loss": 0.0089, "step": 122460 }, { "epoch": 1.32, "learning_rate": 0.00010140429396121165, "loss": 0.0087, "step": 122470 }, { "epoch": 1.32, "learning_rate": 0.00010138807809560873, "loss": 0.0073, "step": 122480 }, { "epoch": 1.32, "learning_rate": 0.00010137186223000583, "loss": 0.0094, "step": 122490 }, { "epoch": 1.32, "learning_rate": 0.00010135564636440293, "loss": 0.0087, "step": 122500 }, { "epoch": 1.32, "learning_rate": 0.00010133943049880002, "loss": 0.0072, "step": 122510 }, { "epoch": 1.32, "learning_rate": 0.00010132321463319711, "loss": 0.0081, "step": 122520 }, { "epoch": 1.32, "learning_rate": 0.0001013069987675942, "loss": 0.0111, "step": 122530 }, { "epoch": 1.32, "learning_rate": 0.0001012907829019913, "loss": 0.0085, "step": 122540 }, { "epoch": 1.32, "learning_rate": 0.0001012745670363884, "loss": 0.0087, "step": 122550 }, { "epoch": 1.32, "learning_rate": 0.00010125835117078548, "loss": 0.0124, "step": 122560 }, { "epoch": 1.33, "learning_rate": 0.00010124213530518259, "loss": 0.0099, "step": 122570 }, { "epoch": 1.33, "learning_rate": 0.00010122591943957967, "loss": 0.009, "step": 122580 }, { "epoch": 1.33, "learning_rate": 0.00010120970357397678, "loss": 0.0086, "step": 122590 }, { "epoch": 1.33, "learning_rate": 0.00010119348770837385, "loss": 0.0075, "step": 122600 }, { "epoch": 1.33, "learning_rate": 0.00010117727184277096, "loss": 0.0077, "step": 122610 }, { "epoch": 1.33, "learning_rate": 0.00010116105597716805, "loss": 0.0109, "step": 122620 }, { "epoch": 1.33, "learning_rate": 0.00010114484011156515, "loss": 0.0076, "step": 122630 }, { "epoch": 1.33, "learning_rate": 0.00010112862424596224, "loss": 0.0088, "step": 122640 }, { "epoch": 1.33, "learning_rate": 0.00010111240838035935, "loss": 0.008, "step": 122650 }, { "epoch": 1.33, "learning_rate": 0.00010109619251475642, "loss": 0.0135, "step": 122660 }, { "epoch": 1.33, "learning_rate": 0.00010107997664915353, "loss": 0.0085, "step": 122670 }, { "epoch": 1.33, "learning_rate": 0.00010106376078355061, "loss": 0.009, "step": 122680 }, { "epoch": 1.33, "learning_rate": 0.00010104754491794772, "loss": 0.0118, "step": 122690 }, { "epoch": 1.33, "learning_rate": 0.0001010313290523448, "loss": 0.0075, "step": 122700 }, { "epoch": 1.33, "learning_rate": 0.0001010151131867419, "loss": 0.0077, "step": 122710 }, { "epoch": 1.33, "learning_rate": 0.000100998897321139, "loss": 0.0076, "step": 122720 }, { "epoch": 1.33, "learning_rate": 0.00010098268145553609, "loss": 0.0085, "step": 122730 }, { "epoch": 1.33, "learning_rate": 0.00010096646558993318, "loss": 0.0093, "step": 122740 }, { "epoch": 1.33, "learning_rate": 0.00010095024972433027, "loss": 0.0088, "step": 122750 }, { "epoch": 1.33, "learning_rate": 0.00010093403385872737, "loss": 0.0112, "step": 122760 }, { "epoch": 1.33, "learning_rate": 0.00010091781799312447, "loss": 0.0086, "step": 122770 }, { "epoch": 1.33, "learning_rate": 0.00010090160212752155, "loss": 0.009, "step": 122780 }, { "epoch": 1.33, "learning_rate": 0.00010088538626191866, "loss": 0.0076, "step": 122790 }, { "epoch": 1.33, "learning_rate": 0.00010086917039631574, "loss": 0.0095, "step": 122800 }, { "epoch": 1.33, "learning_rate": 0.00010085295453071284, "loss": 0.0088, "step": 122810 }, { "epoch": 1.33, "learning_rate": 0.00010083673866510994, "loss": 0.0073, "step": 122820 }, { "epoch": 1.33, "learning_rate": 0.00010082052279950703, "loss": 0.0083, "step": 122830 }, { "epoch": 1.33, "learning_rate": 0.00010080430693390412, "loss": 0.0104, "step": 122840 }, { "epoch": 1.33, "learning_rate": 0.00010078809106830121, "loss": 0.0087, "step": 122850 }, { "epoch": 1.33, "learning_rate": 0.0001007718752026983, "loss": 0.0104, "step": 122860 }, { "epoch": 1.33, "learning_rate": 0.00010075565933709541, "loss": 0.0105, "step": 122870 }, { "epoch": 1.33, "learning_rate": 0.00010073944347149249, "loss": 0.0089, "step": 122880 }, { "epoch": 1.33, "learning_rate": 0.0001007232276058896, "loss": 0.008, "step": 122890 }, { "epoch": 1.33, "learning_rate": 0.00010070701174028668, "loss": 0.0102, "step": 122900 }, { "epoch": 1.33, "learning_rate": 0.00010069079587468378, "loss": 0.0116, "step": 122910 }, { "epoch": 1.33, "learning_rate": 0.00010067458000908086, "loss": 0.0088, "step": 122920 }, { "epoch": 1.33, "learning_rate": 0.00010065836414347797, "loss": 0.0104, "step": 122930 }, { "epoch": 1.33, "learning_rate": 0.00010064214827787506, "loss": 0.0086, "step": 122940 }, { "epoch": 1.33, "learning_rate": 0.00010062593241227215, "loss": 0.0085, "step": 122950 }, { "epoch": 1.33, "learning_rate": 0.00010060971654666925, "loss": 0.0087, "step": 122960 }, { "epoch": 1.33, "learning_rate": 0.00010059350068106635, "loss": 0.0094, "step": 122970 }, { "epoch": 1.33, "learning_rate": 0.00010057728481546343, "loss": 0.0084, "step": 122980 }, { "epoch": 1.33, "learning_rate": 0.00010056106894986054, "loss": 0.0077, "step": 122990 }, { "epoch": 1.33, "learning_rate": 0.00010054485308425762, "loss": 0.0099, "step": 123000 }, { "epoch": 1.33, "eval_cer": 0.9215703646568931, "eval_loss": 0.007654594257473946, "eval_runtime": 121.0821, "eval_samples_per_second": 16.518, "eval_steps_per_second": 4.129, "step": 123000 }, { "epoch": 1.33, "learning_rate": 0.00010052863721865472, "loss": 0.0111, "step": 123010 }, { "epoch": 1.33, "learning_rate": 0.00010051242135305183, "loss": 0.0112, "step": 123020 }, { "epoch": 1.33, "learning_rate": 0.00010049620548744891, "loss": 0.0136, "step": 123030 }, { "epoch": 1.33, "learning_rate": 0.00010047998962184602, "loss": 0.0105, "step": 123040 }, { "epoch": 1.33, "learning_rate": 0.0001004637737562431, "loss": 0.006, "step": 123050 }, { "epoch": 1.33, "learning_rate": 0.0001004475578906402, "loss": 0.01, "step": 123060 }, { "epoch": 1.33, "learning_rate": 0.00010043134202503728, "loss": 0.0093, "step": 123070 }, { "epoch": 1.33, "learning_rate": 0.00010041512615943439, "loss": 0.0076, "step": 123080 }, { "epoch": 1.33, "learning_rate": 0.00010039891029383148, "loss": 0.0114, "step": 123090 }, { "epoch": 1.33, "learning_rate": 0.00010038269442822857, "loss": 0.0102, "step": 123100 }, { "epoch": 1.33, "learning_rate": 0.00010036647856262567, "loss": 0.0079, "step": 123110 }, { "epoch": 1.33, "learning_rate": 0.00010035026269702277, "loss": 0.0066, "step": 123120 }, { "epoch": 1.33, "learning_rate": 0.00010033404683141985, "loss": 0.0091, "step": 123130 }, { "epoch": 1.33, "learning_rate": 0.00010031783096581696, "loss": 0.0095, "step": 123140 }, { "epoch": 1.33, "learning_rate": 0.00010030161510021404, "loss": 0.0073, "step": 123150 }, { "epoch": 1.33, "learning_rate": 0.00010028539923461114, "loss": 0.0086, "step": 123160 }, { "epoch": 1.33, "learning_rate": 0.00010026918336900822, "loss": 0.0092, "step": 123170 }, { "epoch": 1.33, "learning_rate": 0.00010025296750340533, "loss": 0.0081, "step": 123180 }, { "epoch": 1.33, "learning_rate": 0.00010023675163780242, "loss": 0.0094, "step": 123190 }, { "epoch": 1.33, "learning_rate": 0.00010022053577219951, "loss": 0.0092, "step": 123200 }, { "epoch": 1.33, "learning_rate": 0.0001002043199065966, "loss": 0.0089, "step": 123210 }, { "epoch": 1.33, "learning_rate": 0.0001001881040409937, "loss": 0.0076, "step": 123220 }, { "epoch": 1.33, "learning_rate": 0.00010017188817539079, "loss": 0.0088, "step": 123230 }, { "epoch": 1.33, "learning_rate": 0.0001001556723097879, "loss": 0.01, "step": 123240 }, { "epoch": 1.33, "learning_rate": 0.00010013945644418498, "loss": 0.0079, "step": 123250 }, { "epoch": 1.33, "learning_rate": 0.00010012324057858208, "loss": 0.0112, "step": 123260 }, { "epoch": 1.33, "learning_rate": 0.00010010702471297916, "loss": 0.0068, "step": 123270 }, { "epoch": 1.33, "learning_rate": 0.00010009080884737627, "loss": 0.008, "step": 123280 }, { "epoch": 1.33, "learning_rate": 0.00010007459298177335, "loss": 0.0073, "step": 123290 }, { "epoch": 1.33, "learning_rate": 0.00010005837711617045, "loss": 0.0099, "step": 123300 }, { "epoch": 1.33, "learning_rate": 0.00010004216125056755, "loss": 0.0101, "step": 123310 }, { "epoch": 1.33, "learning_rate": 0.00010002594538496464, "loss": 0.0084, "step": 123320 }, { "epoch": 1.33, "learning_rate": 0.00010000972951936173, "loss": 0.0095, "step": 123330 }, { "epoch": 1.33, "learning_rate": 9.999351365375884e-05, "loss": 0.0082, "step": 123340 }, { "epoch": 1.33, "learning_rate": 9.997729778815592e-05, "loss": 0.0092, "step": 123350 }, { "epoch": 1.33, "learning_rate": 9.996108192255302e-05, "loss": 0.0071, "step": 123360 }, { "epoch": 1.33, "learning_rate": 9.99448660569501e-05, "loss": 0.0097, "step": 123370 }, { "epoch": 1.33, "learning_rate": 9.992865019134721e-05, "loss": 0.0081, "step": 123380 }, { "epoch": 1.33, "learning_rate": 9.991243432574429e-05, "loss": 0.0081, "step": 123390 }, { "epoch": 1.33, "learning_rate": 9.98962184601414e-05, "loss": 0.0107, "step": 123400 }, { "epoch": 1.33, "learning_rate": 9.988000259453849e-05, "loss": 0.0092, "step": 123410 }, { "epoch": 1.33, "learning_rate": 9.986378672893558e-05, "loss": 0.0077, "step": 123420 }, { "epoch": 1.33, "learning_rate": 9.984757086333267e-05, "loss": 0.0116, "step": 123430 }, { "epoch": 1.33, "learning_rate": 9.983135499772977e-05, "loss": 0.0065, "step": 123440 }, { "epoch": 1.33, "learning_rate": 9.981513913212686e-05, "loss": 0.0089, "step": 123450 }, { "epoch": 1.33, "learning_rate": 9.979892326652397e-05, "loss": 0.0102, "step": 123460 }, { "epoch": 1.33, "learning_rate": 9.978270740092104e-05, "loss": 0.0062, "step": 123470 }, { "epoch": 1.33, "learning_rate": 9.976649153531815e-05, "loss": 0.008, "step": 123480 }, { "epoch": 1.33, "learning_rate": 9.975027566971523e-05, "loss": 0.0086, "step": 123490 }, { "epoch": 1.34, "learning_rate": 9.973405980411234e-05, "loss": 0.0103, "step": 123500 }, { "epoch": 1.34, "learning_rate": 9.971784393850943e-05, "loss": 0.0078, "step": 123510 }, { "epoch": 1.34, "learning_rate": 9.970162807290652e-05, "loss": 0.009, "step": 123520 }, { "epoch": 1.34, "learning_rate": 9.968541220730361e-05, "loss": 0.0103, "step": 123530 }, { "epoch": 1.34, "learning_rate": 9.966919634170071e-05, "loss": 0.0076, "step": 123540 }, { "epoch": 1.34, "learning_rate": 9.96529804760978e-05, "loss": 0.0097, "step": 123550 }, { "epoch": 1.34, "learning_rate": 9.96367646104949e-05, "loss": 0.0082, "step": 123560 }, { "epoch": 1.34, "learning_rate": 9.962054874489199e-05, "loss": 0.0099, "step": 123570 }, { "epoch": 1.34, "learning_rate": 9.960433287928909e-05, "loss": 0.0097, "step": 123580 }, { "epoch": 1.34, "learning_rate": 9.958811701368617e-05, "loss": 0.0088, "step": 123590 }, { "epoch": 1.34, "learning_rate": 9.957190114808328e-05, "loss": 0.0086, "step": 123600 }, { "epoch": 1.34, "learning_rate": 9.955568528248036e-05, "loss": 0.01, "step": 123610 }, { "epoch": 1.34, "learning_rate": 9.953946941687746e-05, "loss": 0.0086, "step": 123620 }, { "epoch": 1.34, "learning_rate": 9.952325355127456e-05, "loss": 0.0106, "step": 123630 }, { "epoch": 1.34, "learning_rate": 9.950703768567165e-05, "loss": 0.0086, "step": 123640 }, { "epoch": 1.34, "learning_rate": 9.949082182006874e-05, "loss": 0.0105, "step": 123650 }, { "epoch": 1.34, "learning_rate": 9.947460595446585e-05, "loss": 0.0089, "step": 123660 }, { "epoch": 1.34, "learning_rate": 9.945839008886293e-05, "loss": 0.0083, "step": 123670 }, { "epoch": 1.34, "learning_rate": 9.944217422326003e-05, "loss": 0.0094, "step": 123680 }, { "epoch": 1.34, "learning_rate": 9.942595835765711e-05, "loss": 0.0082, "step": 123690 }, { "epoch": 1.34, "learning_rate": 9.940974249205422e-05, "loss": 0.0099, "step": 123700 }, { "epoch": 1.34, "learning_rate": 9.93935266264513e-05, "loss": 0.0079, "step": 123710 }, { "epoch": 1.34, "learning_rate": 9.93773107608484e-05, "loss": 0.0087, "step": 123720 }, { "epoch": 1.34, "learning_rate": 9.936109489524551e-05, "loss": 0.0104, "step": 123730 }, { "epoch": 1.34, "learning_rate": 9.934487902964259e-05, "loss": 0.01, "step": 123740 }, { "epoch": 1.34, "learning_rate": 9.93286631640397e-05, "loss": 0.0093, "step": 123750 }, { "epoch": 1.34, "learning_rate": 9.931244729843678e-05, "loss": 0.0099, "step": 123760 }, { "epoch": 1.34, "learning_rate": 9.929623143283388e-05, "loss": 0.007, "step": 123770 }, { "epoch": 1.34, "learning_rate": 9.928001556723097e-05, "loss": 0.0102, "step": 123780 }, { "epoch": 1.34, "learning_rate": 9.926379970162807e-05, "loss": 0.0074, "step": 123790 }, { "epoch": 1.34, "learning_rate": 9.924758383602516e-05, "loss": 0.0136, "step": 123800 }, { "epoch": 1.34, "learning_rate": 9.923136797042227e-05, "loss": 0.0096, "step": 123810 }, { "epoch": 1.34, "learning_rate": 9.921515210481935e-05, "loss": 0.0082, "step": 123820 }, { "epoch": 1.34, "learning_rate": 9.919893623921645e-05, "loss": 0.0099, "step": 123830 }, { "epoch": 1.34, "learning_rate": 9.918272037361353e-05, "loss": 0.0119, "step": 123840 }, { "epoch": 1.34, "learning_rate": 9.916650450801064e-05, "loss": 0.0076, "step": 123850 }, { "epoch": 1.34, "learning_rate": 9.915028864240772e-05, "loss": 0.0107, "step": 123860 }, { "epoch": 1.34, "learning_rate": 9.913407277680482e-05, "loss": 0.008, "step": 123870 }, { "epoch": 1.34, "learning_rate": 9.911785691120192e-05, "loss": 0.0087, "step": 123880 }, { "epoch": 1.34, "learning_rate": 9.910164104559901e-05, "loss": 0.0088, "step": 123890 }, { "epoch": 1.34, "learning_rate": 9.90854251799961e-05, "loss": 0.0095, "step": 123900 }, { "epoch": 1.34, "learning_rate": 9.90692093143932e-05, "loss": 0.0073, "step": 123910 }, { "epoch": 1.34, "learning_rate": 9.905299344879029e-05, "loss": 0.0074, "step": 123920 }, { "epoch": 1.34, "learning_rate": 9.903677758318739e-05, "loss": 0.0109, "step": 123930 }, { "epoch": 1.34, "learning_rate": 9.902056171758447e-05, "loss": 0.0109, "step": 123940 }, { "epoch": 1.34, "learning_rate": 9.900434585198158e-05, "loss": 0.0096, "step": 123950 }, { "epoch": 1.34, "learning_rate": 9.898812998637866e-05, "loss": 0.0078, "step": 123960 }, { "epoch": 1.34, "learning_rate": 9.897191412077576e-05, "loss": 0.009, "step": 123970 }, { "epoch": 1.34, "learning_rate": 9.895569825517286e-05, "loss": 0.008, "step": 123980 }, { "epoch": 1.34, "learning_rate": 9.893948238956995e-05, "loss": 0.0095, "step": 123990 }, { "epoch": 1.34, "learning_rate": 9.892326652396704e-05, "loss": 0.0105, "step": 124000 }, { "epoch": 1.34, "eval_cer": 0.9215547298036784, "eval_loss": 0.0075076548382639885, "eval_runtime": 121.2801, "eval_samples_per_second": 16.491, "eval_steps_per_second": 4.123, "step": 124000 }, { "epoch": 1.34, "learning_rate": 9.890705065836413e-05, "loss": 0.0077, "step": 124010 }, { "epoch": 1.34, "learning_rate": 9.889083479276123e-05, "loss": 0.0087, "step": 124020 }, { "epoch": 1.34, "learning_rate": 9.887461892715833e-05, "loss": 0.009, "step": 124030 }, { "epoch": 1.34, "learning_rate": 9.885840306155541e-05, "loss": 0.0078, "step": 124040 }, { "epoch": 1.34, "learning_rate": 9.884218719595252e-05, "loss": 0.0071, "step": 124050 }, { "epoch": 1.34, "learning_rate": 9.88259713303496e-05, "loss": 0.0106, "step": 124060 }, { "epoch": 1.34, "learning_rate": 9.88097554647467e-05, "loss": 0.0094, "step": 124070 }, { "epoch": 1.34, "learning_rate": 9.879353959914378e-05, "loss": 0.0104, "step": 124080 }, { "epoch": 1.34, "learning_rate": 9.877732373354089e-05, "loss": 0.0093, "step": 124090 }, { "epoch": 1.34, "learning_rate": 9.876110786793798e-05, "loss": 0.0096, "step": 124100 }, { "epoch": 1.34, "learning_rate": 9.874489200233508e-05, "loss": 0.0075, "step": 124110 }, { "epoch": 1.34, "learning_rate": 9.872867613673217e-05, "loss": 0.0083, "step": 124120 }, { "epoch": 1.34, "learning_rate": 9.871246027112927e-05, "loss": 0.0097, "step": 124130 }, { "epoch": 1.34, "learning_rate": 9.869624440552635e-05, "loss": 0.0088, "step": 124140 }, { "epoch": 1.34, "learning_rate": 9.868002853992346e-05, "loss": 0.0076, "step": 124150 }, { "epoch": 1.34, "learning_rate": 9.866381267432054e-05, "loss": 0.0108, "step": 124160 }, { "epoch": 1.34, "learning_rate": 9.864759680871765e-05, "loss": 0.0083, "step": 124170 }, { "epoch": 1.34, "learning_rate": 9.863138094311472e-05, "loss": 0.0084, "step": 124180 }, { "epoch": 1.34, "learning_rate": 9.861516507751183e-05, "loss": 0.0094, "step": 124190 }, { "epoch": 1.34, "learning_rate": 9.859894921190892e-05, "loss": 0.012, "step": 124200 }, { "epoch": 1.34, "learning_rate": 9.858273334630602e-05, "loss": 0.0093, "step": 124210 }, { "epoch": 1.34, "learning_rate": 9.856651748070311e-05, "loss": 0.0119, "step": 124220 }, { "epoch": 1.34, "learning_rate": 9.85503016151002e-05, "loss": 0.0124, "step": 124230 }, { "epoch": 1.34, "learning_rate": 9.85340857494973e-05, "loss": 0.0091, "step": 124240 }, { "epoch": 1.34, "learning_rate": 9.85178698838944e-05, "loss": 0.0088, "step": 124250 }, { "epoch": 1.34, "learning_rate": 9.850165401829148e-05, "loss": 0.0096, "step": 124260 }, { "epoch": 1.34, "learning_rate": 9.848543815268859e-05, "loss": 0.0087, "step": 124270 }, { "epoch": 1.34, "learning_rate": 9.846922228708567e-05, "loss": 0.0102, "step": 124280 }, { "epoch": 1.34, "learning_rate": 9.845300642148277e-05, "loss": 0.0095, "step": 124290 }, { "epoch": 1.34, "learning_rate": 9.843679055587985e-05, "loss": 0.0075, "step": 124300 }, { "epoch": 1.34, "learning_rate": 9.842057469027696e-05, "loss": 0.0095, "step": 124310 }, { "epoch": 1.34, "learning_rate": 9.840435882467405e-05, "loss": 0.0096, "step": 124320 }, { "epoch": 1.34, "learning_rate": 9.838814295907114e-05, "loss": 0.0081, "step": 124330 }, { "epoch": 1.34, "learning_rate": 9.837192709346824e-05, "loss": 0.0066, "step": 124340 }, { "epoch": 1.34, "learning_rate": 9.835571122786534e-05, "loss": 0.0072, "step": 124350 }, { "epoch": 1.34, "learning_rate": 9.833949536226242e-05, "loss": 0.0084, "step": 124360 }, { "epoch": 1.34, "learning_rate": 9.832327949665953e-05, "loss": 0.0085, "step": 124370 }, { "epoch": 1.34, "learning_rate": 9.83070636310566e-05, "loss": 0.0091, "step": 124380 }, { "epoch": 1.34, "learning_rate": 9.829084776545371e-05, "loss": 0.0082, "step": 124390 }, { "epoch": 1.34, "learning_rate": 9.827463189985079e-05, "loss": 0.0103, "step": 124400 }, { "epoch": 1.34, "learning_rate": 9.82584160342479e-05, "loss": 0.008, "step": 124410 }, { "epoch": 1.35, "learning_rate": 9.824220016864499e-05, "loss": 0.0088, "step": 124420 }, { "epoch": 1.35, "learning_rate": 9.822598430304208e-05, "loss": 0.008, "step": 124430 }, { "epoch": 1.35, "learning_rate": 9.820976843743919e-05, "loss": 0.0085, "step": 124440 }, { "epoch": 1.35, "learning_rate": 9.819355257183627e-05, "loss": 0.007, "step": 124450 }, { "epoch": 1.35, "learning_rate": 9.817733670623338e-05, "loss": 0.0082, "step": 124460 }, { "epoch": 1.35, "learning_rate": 9.816112084063047e-05, "loss": 0.0084, "step": 124470 }, { "epoch": 1.35, "learning_rate": 9.814490497502756e-05, "loss": 0.008, "step": 124480 }, { "epoch": 1.35, "learning_rate": 9.812868910942465e-05, "loss": 0.0091, "step": 124490 }, { "epoch": 1.35, "learning_rate": 9.811247324382176e-05, "loss": 0.0079, "step": 124500 }, { "epoch": 1.35, "learning_rate": 9.809625737821884e-05, "loss": 0.0101, "step": 124510 }, { "epoch": 1.35, "learning_rate": 9.808004151261595e-05, "loss": 0.0076, "step": 124520 }, { "epoch": 1.35, "learning_rate": 9.806382564701302e-05, "loss": 0.0067, "step": 124530 }, { "epoch": 1.35, "learning_rate": 9.804760978141013e-05, "loss": 0.0074, "step": 124540 }, { "epoch": 1.35, "learning_rate": 9.803139391580721e-05, "loss": 0.0083, "step": 124550 }, { "epoch": 1.35, "learning_rate": 9.801517805020432e-05, "loss": 0.0071, "step": 124560 }, { "epoch": 1.35, "learning_rate": 9.799896218460141e-05, "loss": 0.0097, "step": 124570 }, { "epoch": 1.35, "learning_rate": 9.79827463189985e-05, "loss": 0.0083, "step": 124580 }, { "epoch": 1.35, "learning_rate": 9.79665304533956e-05, "loss": 0.007, "step": 124590 }, { "epoch": 1.35, "learning_rate": 9.795031458779269e-05, "loss": 0.0096, "step": 124600 }, { "epoch": 1.35, "learning_rate": 9.793409872218978e-05, "loss": 0.0096, "step": 124610 }, { "epoch": 1.35, "learning_rate": 9.791788285658689e-05, "loss": 0.0091, "step": 124620 }, { "epoch": 1.35, "learning_rate": 9.790166699098397e-05, "loss": 0.0109, "step": 124630 }, { "epoch": 1.35, "learning_rate": 9.788545112538107e-05, "loss": 0.0093, "step": 124640 }, { "epoch": 1.35, "learning_rate": 9.786923525977815e-05, "loss": 0.0126, "step": 124650 }, { "epoch": 1.35, "learning_rate": 9.785301939417526e-05, "loss": 0.0113, "step": 124660 }, { "epoch": 1.35, "learning_rate": 9.783680352857235e-05, "loss": 0.0078, "step": 124670 }, { "epoch": 1.35, "learning_rate": 9.782058766296944e-05, "loss": 0.0119, "step": 124680 }, { "epoch": 1.35, "learning_rate": 9.780437179736654e-05, "loss": 0.01, "step": 124690 }, { "epoch": 1.35, "learning_rate": 9.778815593176363e-05, "loss": 0.0082, "step": 124700 }, { "epoch": 1.35, "learning_rate": 9.777194006616072e-05, "loss": 0.0132, "step": 124710 }, { "epoch": 1.35, "learning_rate": 9.775572420055783e-05, "loss": 0.0079, "step": 124720 }, { "epoch": 1.35, "learning_rate": 9.77395083349549e-05, "loss": 0.0094, "step": 124730 }, { "epoch": 1.35, "learning_rate": 9.772329246935201e-05, "loss": 0.0119, "step": 124740 }, { "epoch": 1.35, "learning_rate": 9.770707660374909e-05, "loss": 0.0108, "step": 124750 }, { "epoch": 1.35, "learning_rate": 9.76908607381462e-05, "loss": 0.0094, "step": 124760 }, { "epoch": 1.35, "learning_rate": 9.767464487254328e-05, "loss": 0.009, "step": 124770 }, { "epoch": 1.35, "learning_rate": 9.765842900694038e-05, "loss": 0.0084, "step": 124780 }, { "epoch": 1.35, "learning_rate": 9.764221314133748e-05, "loss": 0.0102, "step": 124790 }, { "epoch": 1.35, "learning_rate": 9.762599727573457e-05, "loss": 0.0094, "step": 124800 }, { "epoch": 1.35, "learning_rate": 9.760978141013166e-05, "loss": 0.0083, "step": 124810 }, { "epoch": 1.35, "learning_rate": 9.759356554452877e-05, "loss": 0.0091, "step": 124820 }, { "epoch": 1.35, "learning_rate": 9.757734967892585e-05, "loss": 0.0093, "step": 124830 }, { "epoch": 1.35, "learning_rate": 9.756113381332295e-05, "loss": 0.0092, "step": 124840 }, { "epoch": 1.35, "learning_rate": 9.754491794772003e-05, "loss": 0.0072, "step": 124850 }, { "epoch": 1.35, "learning_rate": 9.752870208211714e-05, "loss": 0.0119, "step": 124860 }, { "epoch": 1.35, "learning_rate": 9.751248621651422e-05, "loss": 0.0074, "step": 124870 }, { "epoch": 1.35, "learning_rate": 9.749627035091132e-05, "loss": 0.0105, "step": 124880 }, { "epoch": 1.35, "learning_rate": 9.748005448530842e-05, "loss": 0.0085, "step": 124890 }, { "epoch": 1.35, "learning_rate": 9.746383861970551e-05, "loss": 0.0077, "step": 124900 }, { "epoch": 1.35, "learning_rate": 9.74476227541026e-05, "loss": 0.0096, "step": 124910 }, { "epoch": 1.35, "learning_rate": 9.74314068884997e-05, "loss": 0.0081, "step": 124920 }, { "epoch": 1.35, "learning_rate": 9.741519102289679e-05, "loss": 0.0095, "step": 124930 }, { "epoch": 1.35, "learning_rate": 9.73989751572939e-05, "loss": 0.0082, "step": 124940 }, { "epoch": 1.35, "learning_rate": 9.738275929169097e-05, "loss": 0.0151, "step": 124950 }, { "epoch": 1.35, "learning_rate": 9.736654342608808e-05, "loss": 0.008, "step": 124960 }, { "epoch": 1.35, "learning_rate": 9.735032756048516e-05, "loss": 0.0099, "step": 124970 }, { "epoch": 1.35, "learning_rate": 9.733411169488227e-05, "loss": 0.0093, "step": 124980 }, { "epoch": 1.35, "learning_rate": 9.731789582927936e-05, "loss": 0.0104, "step": 124990 }, { "epoch": 1.35, "learning_rate": 9.730167996367645e-05, "loss": 0.0082, "step": 125000 }, { "epoch": 1.35, "eval_cer": 0.9215807878923696, "eval_loss": 0.007421437185257673, "eval_runtime": 121.2555, "eval_samples_per_second": 16.494, "eval_steps_per_second": 4.124, "step": 125000 }, { "epoch": 1.35, "learning_rate": 9.728546409807354e-05, "loss": 0.0076, "step": 125010 }, { "epoch": 1.35, "learning_rate": 9.726924823247064e-05, "loss": 0.0074, "step": 125020 }, { "epoch": 1.35, "learning_rate": 9.725303236686773e-05, "loss": 0.0084, "step": 125030 }, { "epoch": 1.35, "learning_rate": 9.723681650126484e-05, "loss": 0.0114, "step": 125040 }, { "epoch": 1.35, "learning_rate": 9.722060063566192e-05, "loss": 0.0091, "step": 125050 }, { "epoch": 1.35, "learning_rate": 9.720438477005902e-05, "loss": 0.0077, "step": 125060 }, { "epoch": 1.35, "learning_rate": 9.71881689044561e-05, "loss": 0.0093, "step": 125070 }, { "epoch": 1.35, "learning_rate": 9.717195303885321e-05, "loss": 0.0113, "step": 125080 }, { "epoch": 1.35, "learning_rate": 9.715573717325029e-05, "loss": 0.0081, "step": 125090 }, { "epoch": 1.35, "learning_rate": 9.713952130764739e-05, "loss": 0.0097, "step": 125100 }, { "epoch": 1.35, "learning_rate": 9.712330544204449e-05, "loss": 0.0097, "step": 125110 }, { "epoch": 1.35, "learning_rate": 9.710708957644158e-05, "loss": 0.0084, "step": 125120 }, { "epoch": 1.35, "learning_rate": 9.709087371083867e-05, "loss": 0.01, "step": 125130 }, { "epoch": 1.35, "learning_rate": 9.707465784523578e-05, "loss": 0.009, "step": 125140 }, { "epoch": 1.35, "learning_rate": 9.705844197963286e-05, "loss": 0.0088, "step": 125150 }, { "epoch": 1.35, "learning_rate": 9.704222611402996e-05, "loss": 0.0107, "step": 125160 }, { "epoch": 1.35, "learning_rate": 9.702601024842706e-05, "loss": 0.0098, "step": 125170 }, { "epoch": 1.35, "learning_rate": 9.700979438282415e-05, "loss": 0.0076, "step": 125180 }, { "epoch": 1.35, "learning_rate": 9.699357851722125e-05, "loss": 0.0095, "step": 125190 }, { "epoch": 1.35, "learning_rate": 9.697736265161833e-05, "loss": 0.0078, "step": 125200 }, { "epoch": 1.35, "learning_rate": 9.696114678601544e-05, "loss": 0.0108, "step": 125210 }, { "epoch": 1.35, "learning_rate": 9.694493092041252e-05, "loss": 0.0087, "step": 125220 }, { "epoch": 1.35, "learning_rate": 9.692871505480963e-05, "loss": 0.0126, "step": 125230 }, { "epoch": 1.35, "learning_rate": 9.69124991892067e-05, "loss": 0.0093, "step": 125240 }, { "epoch": 1.35, "learning_rate": 9.689628332360381e-05, "loss": 0.0088, "step": 125250 }, { "epoch": 1.35, "learning_rate": 9.68800674580009e-05, "loss": 0.0071, "step": 125260 }, { "epoch": 1.35, "learning_rate": 9.6863851592398e-05, "loss": 0.0123, "step": 125270 }, { "epoch": 1.35, "learning_rate": 9.684763572679509e-05, "loss": 0.0108, "step": 125280 }, { "epoch": 1.35, "learning_rate": 9.68314198611922e-05, "loss": 0.0067, "step": 125290 }, { "epoch": 1.35, "learning_rate": 9.681520399558927e-05, "loss": 0.0075, "step": 125300 }, { "epoch": 1.35, "learning_rate": 9.679898812998638e-05, "loss": 0.0075, "step": 125310 }, { "epoch": 1.35, "learning_rate": 9.678277226438346e-05, "loss": 0.0096, "step": 125320 }, { "epoch": 1.35, "learning_rate": 9.676655639878057e-05, "loss": 0.0083, "step": 125330 }, { "epoch": 1.35, "learning_rate": 9.675034053317765e-05, "loss": 0.0086, "step": 125340 }, { "epoch": 1.36, "learning_rate": 9.673412466757475e-05, "loss": 0.008, "step": 125350 }, { "epoch": 1.36, "learning_rate": 9.671790880197184e-05, "loss": 0.0076, "step": 125360 }, { "epoch": 1.36, "learning_rate": 9.670169293636894e-05, "loss": 0.01, "step": 125370 }, { "epoch": 1.36, "learning_rate": 9.668547707076603e-05, "loss": 0.0104, "step": 125380 }, { "epoch": 1.36, "learning_rate": 9.666926120516312e-05, "loss": 0.01, "step": 125390 }, { "epoch": 1.36, "learning_rate": 9.665304533956022e-05, "loss": 0.009, "step": 125400 }, { "epoch": 1.36, "learning_rate": 9.663682947395732e-05, "loss": 0.0098, "step": 125410 }, { "epoch": 1.36, "learning_rate": 9.66206136083544e-05, "loss": 0.0075, "step": 125420 }, { "epoch": 1.36, "learning_rate": 9.660439774275151e-05, "loss": 0.0089, "step": 125430 }, { "epoch": 1.36, "learning_rate": 9.658818187714859e-05, "loss": 0.0082, "step": 125440 }, { "epoch": 1.36, "learning_rate": 9.657196601154569e-05, "loss": 0.0063, "step": 125450 }, { "epoch": 1.36, "learning_rate": 9.655575014594277e-05, "loss": 0.0084, "step": 125460 }, { "epoch": 1.36, "learning_rate": 9.653953428033988e-05, "loss": 0.0099, "step": 125470 }, { "epoch": 1.36, "learning_rate": 9.652331841473697e-05, "loss": 0.0091, "step": 125480 }, { "epoch": 1.36, "learning_rate": 9.650710254913406e-05, "loss": 0.0113, "step": 125490 }, { "epoch": 1.36, "learning_rate": 9.649088668353116e-05, "loss": 0.0127, "step": 125500 }, { "epoch": 1.36, "learning_rate": 9.647467081792826e-05, "loss": 0.0092, "step": 125510 }, { "epoch": 1.36, "learning_rate": 9.645845495232534e-05, "loss": 0.0096, "step": 125520 }, { "epoch": 1.36, "learning_rate": 9.644223908672245e-05, "loss": 0.008, "step": 125530 }, { "epoch": 1.36, "learning_rate": 9.642602322111953e-05, "loss": 0.0102, "step": 125540 }, { "epoch": 1.36, "learning_rate": 9.640980735551663e-05, "loss": 0.0104, "step": 125550 }, { "epoch": 1.36, "learning_rate": 9.639359148991371e-05, "loss": 0.0088, "step": 125560 }, { "epoch": 1.36, "learning_rate": 9.637737562431082e-05, "loss": 0.0097, "step": 125570 }, { "epoch": 1.36, "learning_rate": 9.636115975870791e-05, "loss": 0.0079, "step": 125580 }, { "epoch": 1.36, "learning_rate": 9.6344943893105e-05, "loss": 0.0116, "step": 125590 }, { "epoch": 1.36, "learning_rate": 9.63287280275021e-05, "loss": 0.0084, "step": 125600 }, { "epoch": 1.36, "learning_rate": 9.631251216189919e-05, "loss": 0.0077, "step": 125610 }, { "epoch": 1.36, "learning_rate": 9.629629629629628e-05, "loss": 0.0097, "step": 125620 }, { "epoch": 1.36, "learning_rate": 9.628008043069339e-05, "loss": 0.0078, "step": 125630 }, { "epoch": 1.36, "learning_rate": 9.626386456509047e-05, "loss": 0.0145, "step": 125640 }, { "epoch": 1.36, "learning_rate": 9.624764869948757e-05, "loss": 0.0106, "step": 125650 }, { "epoch": 1.36, "learning_rate": 9.623143283388465e-05, "loss": 0.0083, "step": 125660 }, { "epoch": 1.36, "learning_rate": 9.621521696828176e-05, "loss": 0.0102, "step": 125670 }, { "epoch": 1.36, "learning_rate": 9.619900110267885e-05, "loss": 0.0103, "step": 125680 }, { "epoch": 1.36, "learning_rate": 9.618278523707595e-05, "loss": 0.0081, "step": 125690 }, { "epoch": 1.36, "learning_rate": 9.616656937147304e-05, "loss": 0.0094, "step": 125700 }, { "epoch": 1.36, "learning_rate": 9.615035350587013e-05, "loss": 0.0074, "step": 125710 }, { "epoch": 1.36, "learning_rate": 9.613413764026722e-05, "loss": 0.0067, "step": 125720 }, { "epoch": 1.36, "learning_rate": 9.611792177466433e-05, "loss": 0.0076, "step": 125730 }, { "epoch": 1.36, "learning_rate": 9.610170590906141e-05, "loss": 0.0087, "step": 125740 }, { "epoch": 1.36, "learning_rate": 9.608549004345852e-05, "loss": 0.0072, "step": 125750 }, { "epoch": 1.36, "learning_rate": 9.60692741778556e-05, "loss": 0.0074, "step": 125760 }, { "epoch": 1.36, "learning_rate": 9.60530583122527e-05, "loss": 0.0087, "step": 125770 }, { "epoch": 1.36, "learning_rate": 9.603684244664978e-05, "loss": 0.0074, "step": 125780 }, { "epoch": 1.36, "learning_rate": 9.602062658104689e-05, "loss": 0.0093, "step": 125790 }, { "epoch": 1.36, "learning_rate": 9.600441071544398e-05, "loss": 0.0098, "step": 125800 }, { "epoch": 1.36, "learning_rate": 9.598819484984107e-05, "loss": 0.0073, "step": 125810 }, { "epoch": 1.36, "learning_rate": 9.597197898423816e-05, "loss": 0.0102, "step": 125820 }, { "epoch": 1.36, "learning_rate": 9.595576311863527e-05, "loss": 0.0103, "step": 125830 }, { "epoch": 1.36, "learning_rate": 9.593954725303235e-05, "loss": 0.0089, "step": 125840 }, { "epoch": 1.36, "learning_rate": 9.592333138742946e-05, "loss": 0.0075, "step": 125850 }, { "epoch": 1.36, "learning_rate": 9.590711552182654e-05, "loss": 0.0075, "step": 125860 }, { "epoch": 1.36, "learning_rate": 9.589089965622364e-05, "loss": 0.0083, "step": 125870 }, { "epoch": 1.36, "learning_rate": 9.587468379062075e-05, "loss": 0.0059, "step": 125880 }, { "epoch": 1.36, "learning_rate": 9.585846792501783e-05, "loss": 0.0086, "step": 125890 }, { "epoch": 1.36, "learning_rate": 9.584225205941493e-05, "loss": 0.0085, "step": 125900 }, { "epoch": 1.36, "learning_rate": 9.582603619381201e-05, "loss": 0.0075, "step": 125910 }, { "epoch": 1.36, "learning_rate": 9.580982032820912e-05, "loss": 0.0104, "step": 125920 }, { "epoch": 1.36, "learning_rate": 9.57936044626062e-05, "loss": 0.0092, "step": 125930 }, { "epoch": 1.36, "learning_rate": 9.57773885970033e-05, "loss": 0.0088, "step": 125940 }, { "epoch": 1.36, "learning_rate": 9.57611727314004e-05, "loss": 0.0089, "step": 125950 }, { "epoch": 1.36, "learning_rate": 9.574495686579749e-05, "loss": 0.0093, "step": 125960 }, { "epoch": 1.36, "learning_rate": 9.572874100019458e-05, "loss": 0.012, "step": 125970 }, { "epoch": 1.36, "learning_rate": 9.571252513459169e-05, "loss": 0.0101, "step": 125980 }, { "epoch": 1.36, "learning_rate": 9.569630926898877e-05, "loss": 0.0113, "step": 125990 }, { "epoch": 1.36, "learning_rate": 9.568009340338587e-05, "loss": 0.0088, "step": 126000 }, { "epoch": 1.36, "eval_cer": 0.9215417007593327, "eval_loss": 0.007199176587164402, "eval_runtime": 121.2136, "eval_samples_per_second": 16.5, "eval_steps_per_second": 4.125, "step": 126000 }, { "epoch": 1.36, "learning_rate": 9.566387753778295e-05, "loss": 0.0101, "step": 126010 }, { "epoch": 1.36, "learning_rate": 9.564766167218006e-05, "loss": 0.0092, "step": 126020 }, { "epoch": 1.36, "learning_rate": 9.563144580657714e-05, "loss": 0.0098, "step": 126030 }, { "epoch": 1.36, "learning_rate": 9.561522994097425e-05, "loss": 0.0096, "step": 126040 }, { "epoch": 1.36, "learning_rate": 9.559901407537134e-05, "loss": 0.0077, "step": 126050 }, { "epoch": 1.36, "learning_rate": 9.558279820976843e-05, "loss": 0.0103, "step": 126060 }, { "epoch": 1.36, "learning_rate": 9.556658234416552e-05, "loss": 0.0099, "step": 126070 }, { "epoch": 1.36, "learning_rate": 9.555036647856262e-05, "loss": 0.0097, "step": 126080 }, { "epoch": 1.36, "learning_rate": 9.553415061295971e-05, "loss": 0.0085, "step": 126090 }, { "epoch": 1.36, "learning_rate": 9.551793474735682e-05, "loss": 0.0113, "step": 126100 }, { "epoch": 1.36, "learning_rate": 9.55017188817539e-05, "loss": 0.0067, "step": 126110 }, { "epoch": 1.36, "learning_rate": 9.5485503016151e-05, "loss": 0.0111, "step": 126120 }, { "epoch": 1.36, "learning_rate": 9.546928715054808e-05, "loss": 0.01, "step": 126130 }, { "epoch": 1.36, "learning_rate": 9.545307128494519e-05, "loss": 0.0098, "step": 126140 }, { "epoch": 1.36, "learning_rate": 9.543685541934228e-05, "loss": 0.0391, "step": 126150 }, { "epoch": 1.36, "learning_rate": 9.542063955373937e-05, "loss": 0.0083, "step": 126160 }, { "epoch": 1.36, "learning_rate": 9.540442368813647e-05, "loss": 0.0085, "step": 126170 }, { "epoch": 1.36, "learning_rate": 9.538820782253356e-05, "loss": 0.0089, "step": 126180 }, { "epoch": 1.36, "learning_rate": 9.537199195693065e-05, "loss": 0.0075, "step": 126190 }, { "epoch": 1.36, "learning_rate": 9.535577609132776e-05, "loss": 0.008, "step": 126200 }, { "epoch": 1.36, "learning_rate": 9.533956022572484e-05, "loss": 0.0106, "step": 126210 }, { "epoch": 1.36, "learning_rate": 9.532334436012194e-05, "loss": 0.0089, "step": 126220 }, { "epoch": 1.36, "learning_rate": 9.530712849451902e-05, "loss": 0.0087, "step": 126230 }, { "epoch": 1.36, "learning_rate": 9.529091262891613e-05, "loss": 0.0077, "step": 126240 }, { "epoch": 1.36, "learning_rate": 9.527469676331321e-05, "loss": 0.0097, "step": 126250 }, { "epoch": 1.36, "learning_rate": 9.525848089771031e-05, "loss": 0.0079, "step": 126260 }, { "epoch": 1.37, "learning_rate": 9.52422650321074e-05, "loss": 0.0082, "step": 126270 }, { "epoch": 1.37, "learning_rate": 9.52260491665045e-05, "loss": 0.0089, "step": 126280 }, { "epoch": 1.37, "learning_rate": 9.520983330090159e-05, "loss": 0.0073, "step": 126290 }, { "epoch": 1.37, "learning_rate": 9.51936174352987e-05, "loss": 0.0092, "step": 126300 }, { "epoch": 1.37, "learning_rate": 9.517740156969578e-05, "loss": 0.0077, "step": 126310 }, { "epoch": 1.37, "learning_rate": 9.516118570409288e-05, "loss": 0.0089, "step": 126320 }, { "epoch": 1.37, "learning_rate": 9.514496983848996e-05, "loss": 0.0086, "step": 126330 }, { "epoch": 1.37, "learning_rate": 9.512875397288707e-05, "loss": 0.007, "step": 126340 }, { "epoch": 1.37, "learning_rate": 9.511253810728415e-05, "loss": 0.0075, "step": 126350 }, { "epoch": 1.37, "learning_rate": 9.509632224168125e-05, "loss": 0.0075, "step": 126360 }, { "epoch": 1.37, "learning_rate": 9.508010637607835e-05, "loss": 0.0101, "step": 126370 }, { "epoch": 1.37, "learning_rate": 9.506389051047544e-05, "loss": 0.0086, "step": 126380 }, { "epoch": 1.37, "learning_rate": 9.504767464487253e-05, "loss": 0.01, "step": 126390 }, { "epoch": 1.37, "learning_rate": 9.503145877926963e-05, "loss": 0.0066, "step": 126400 }, { "epoch": 1.37, "learning_rate": 9.501524291366672e-05, "loss": 0.0075, "step": 126410 }, { "epoch": 1.37, "learning_rate": 9.499902704806382e-05, "loss": 0.0097, "step": 126420 }, { "epoch": 1.37, "learning_rate": 9.49828111824609e-05, "loss": 0.0074, "step": 126430 }, { "epoch": 1.37, "learning_rate": 9.496659531685801e-05, "loss": 0.0159, "step": 126440 }, { "epoch": 1.37, "learning_rate": 9.495037945125509e-05, "loss": 0.0072, "step": 126450 }, { "epoch": 1.37, "learning_rate": 9.49341635856522e-05, "loss": 0.0116, "step": 126460 }, { "epoch": 1.37, "learning_rate": 9.491794772004927e-05, "loss": 0.0091, "step": 126470 }, { "epoch": 1.37, "learning_rate": 9.490173185444638e-05, "loss": 0.0079, "step": 126480 }, { "epoch": 1.37, "learning_rate": 9.488551598884347e-05, "loss": 0.0078, "step": 126490 }, { "epoch": 1.37, "learning_rate": 9.486930012324057e-05, "loss": 0.0082, "step": 126500 }, { "epoch": 1.37, "learning_rate": 9.485308425763766e-05, "loss": 0.0079, "step": 126510 }, { "epoch": 1.37, "learning_rate": 9.483686839203477e-05, "loss": 0.0089, "step": 126520 }, { "epoch": 1.37, "learning_rate": 9.482065252643184e-05, "loss": 0.0094, "step": 126530 }, { "epoch": 1.37, "learning_rate": 9.480443666082895e-05, "loss": 0.0083, "step": 126540 }, { "epoch": 1.37, "learning_rate": 9.478822079522603e-05, "loss": 0.0112, "step": 126550 }, { "epoch": 1.37, "learning_rate": 9.477200492962314e-05, "loss": 0.0065, "step": 126560 }, { "epoch": 1.37, "learning_rate": 9.475578906402022e-05, "loss": 0.0099, "step": 126570 }, { "epoch": 1.37, "learning_rate": 9.473957319841732e-05, "loss": 0.0099, "step": 126580 }, { "epoch": 1.37, "learning_rate": 9.472335733281441e-05, "loss": 0.0081, "step": 126590 }, { "epoch": 1.37, "learning_rate": 9.470714146721151e-05, "loss": 0.0102, "step": 126600 }, { "epoch": 1.37, "learning_rate": 9.469092560160861e-05, "loss": 0.0096, "step": 126610 }, { "epoch": 1.37, "learning_rate": 9.467470973600569e-05, "loss": 0.0067, "step": 126620 }, { "epoch": 1.37, "learning_rate": 9.46584938704028e-05, "loss": 0.0097, "step": 126630 }, { "epoch": 1.37, "learning_rate": 9.464227800479989e-05, "loss": 0.0088, "step": 126640 }, { "epoch": 1.37, "learning_rate": 9.462606213919698e-05, "loss": 0.0081, "step": 126650 }, { "epoch": 1.37, "learning_rate": 9.460984627359408e-05, "loss": 0.008, "step": 126660 }, { "epoch": 1.37, "learning_rate": 9.459363040799118e-05, "loss": 0.0087, "step": 126670 }, { "epoch": 1.37, "learning_rate": 9.457741454238826e-05, "loss": 0.0082, "step": 126680 }, { "epoch": 1.37, "learning_rate": 9.456119867678537e-05, "loss": 0.0077, "step": 126690 }, { "epoch": 1.37, "learning_rate": 9.454498281118245e-05, "loss": 0.0087, "step": 126700 }, { "epoch": 1.37, "learning_rate": 9.452876694557955e-05, "loss": 0.0093, "step": 126710 }, { "epoch": 1.37, "learning_rate": 9.451255107997663e-05, "loss": 0.0083, "step": 126720 }, { "epoch": 1.37, "learning_rate": 9.449633521437374e-05, "loss": 0.0084, "step": 126730 }, { "epoch": 1.37, "learning_rate": 9.448011934877083e-05, "loss": 0.0099, "step": 126740 }, { "epoch": 1.37, "learning_rate": 9.446390348316793e-05, "loss": 0.0091, "step": 126750 }, { "epoch": 1.37, "learning_rate": 9.444768761756502e-05, "loss": 0.0098, "step": 126760 }, { "epoch": 1.37, "learning_rate": 9.443147175196212e-05, "loss": 0.0116, "step": 126770 }, { "epoch": 1.37, "learning_rate": 9.44152558863592e-05, "loss": 0.0083, "step": 126780 }, { "epoch": 1.37, "learning_rate": 9.439904002075631e-05, "loss": 0.0115, "step": 126790 }, { "epoch": 1.37, "learning_rate": 9.438282415515339e-05, "loss": 0.0081, "step": 126800 }, { "epoch": 1.37, "learning_rate": 9.43666082895505e-05, "loss": 0.0086, "step": 126810 }, { "epoch": 1.37, "learning_rate": 9.435039242394757e-05, "loss": 0.0056, "step": 126820 }, { "epoch": 1.37, "learning_rate": 9.433417655834468e-05, "loss": 0.0087, "step": 126830 }, { "epoch": 1.37, "learning_rate": 9.431796069274177e-05, "loss": 0.0083, "step": 126840 }, { "epoch": 1.37, "learning_rate": 9.430174482713887e-05, "loss": 0.0097, "step": 126850 }, { "epoch": 1.37, "learning_rate": 9.428552896153596e-05, "loss": 0.0099, "step": 126860 }, { "epoch": 1.37, "learning_rate": 9.426931309593305e-05, "loss": 0.0084, "step": 126870 }, { "epoch": 1.37, "learning_rate": 9.425309723033014e-05, "loss": 0.0084, "step": 126880 }, { "epoch": 1.37, "learning_rate": 9.423688136472725e-05, "loss": 0.0107, "step": 126890 }, { "epoch": 1.37, "learning_rate": 9.422066549912433e-05, "loss": 0.0092, "step": 126900 }, { "epoch": 1.37, "learning_rate": 9.420444963352144e-05, "loss": 0.0088, "step": 126910 }, { "epoch": 1.37, "learning_rate": 9.418823376791852e-05, "loss": 0.008, "step": 126920 }, { "epoch": 1.37, "learning_rate": 9.417201790231562e-05, "loss": 0.0091, "step": 126930 }, { "epoch": 1.37, "learning_rate": 9.41558020367127e-05, "loss": 0.0099, "step": 126940 }, { "epoch": 1.37, "learning_rate": 9.413958617110981e-05, "loss": 0.008, "step": 126950 }, { "epoch": 1.37, "learning_rate": 9.41233703055069e-05, "loss": 0.0114, "step": 126960 }, { "epoch": 1.37, "learning_rate": 9.410715443990399e-05, "loss": 0.0086, "step": 126970 }, { "epoch": 1.37, "learning_rate": 9.409093857430109e-05, "loss": 0.0095, "step": 126980 }, { "epoch": 1.37, "learning_rate": 9.407472270869819e-05, "loss": 0.0087, "step": 126990 }, { "epoch": 1.37, "learning_rate": 9.405850684309527e-05, "loss": 0.0077, "step": 127000 }, { "epoch": 1.37, "eval_cer": 0.9215199856854233, "eval_loss": 0.007032403256744146, "eval_runtime": 121.345, "eval_samples_per_second": 16.482, "eval_steps_per_second": 4.12, "step": 127000 }, { "epoch": 1.37, "learning_rate": 9.404229097749238e-05, "loss": 0.007, "step": 127010 }, { "epoch": 1.37, "learning_rate": 9.402607511188946e-05, "loss": 0.009, "step": 127020 }, { "epoch": 1.37, "learning_rate": 9.400985924628656e-05, "loss": 0.0084, "step": 127030 }, { "epoch": 1.37, "learning_rate": 9.399364338068364e-05, "loss": 0.0111, "step": 127040 }, { "epoch": 1.37, "learning_rate": 9.397742751508075e-05, "loss": 0.0109, "step": 127050 }, { "epoch": 1.37, "learning_rate": 9.396121164947784e-05, "loss": 0.0085, "step": 127060 }, { "epoch": 1.37, "learning_rate": 9.394499578387493e-05, "loss": 0.0078, "step": 127070 }, { "epoch": 1.37, "learning_rate": 9.392877991827203e-05, "loss": 0.0087, "step": 127080 }, { "epoch": 1.37, "learning_rate": 9.391256405266912e-05, "loss": 0.0084, "step": 127090 }, { "epoch": 1.37, "learning_rate": 9.389634818706621e-05, "loss": 0.0088, "step": 127100 }, { "epoch": 1.37, "learning_rate": 9.388013232146332e-05, "loss": 0.0087, "step": 127110 }, { "epoch": 1.37, "learning_rate": 9.38639164558604e-05, "loss": 0.0082, "step": 127120 }, { "epoch": 1.37, "learning_rate": 9.38477005902575e-05, "loss": 0.0089, "step": 127130 }, { "epoch": 1.37, "learning_rate": 9.383148472465458e-05, "loss": 0.011, "step": 127140 }, { "epoch": 1.37, "learning_rate": 9.381526885905169e-05, "loss": 0.01, "step": 127150 }, { "epoch": 1.37, "learning_rate": 9.379905299344878e-05, "loss": 0.009, "step": 127160 }, { "epoch": 1.37, "learning_rate": 9.378283712784587e-05, "loss": 0.0089, "step": 127170 }, { "epoch": 1.37, "learning_rate": 9.376662126224297e-05, "loss": 0.0068, "step": 127180 }, { "epoch": 1.37, "learning_rate": 9.375040539664006e-05, "loss": 0.0088, "step": 127190 }, { "epoch": 1.38, "learning_rate": 9.373418953103715e-05, "loss": 0.008, "step": 127200 }, { "epoch": 1.38, "learning_rate": 9.371797366543426e-05, "loss": 0.0124, "step": 127210 }, { "epoch": 1.38, "learning_rate": 9.370175779983134e-05, "loss": 0.0082, "step": 127220 }, { "epoch": 1.38, "learning_rate": 9.368554193422844e-05, "loss": 0.0124, "step": 127230 }, { "epoch": 1.38, "learning_rate": 9.366932606862552e-05, "loss": 0.0107, "step": 127240 }, { "epoch": 1.38, "learning_rate": 9.365311020302263e-05, "loss": 0.0081, "step": 127250 }, { "epoch": 1.38, "learning_rate": 9.363689433741971e-05, "loss": 0.0082, "step": 127260 }, { "epoch": 1.38, "learning_rate": 9.362067847181682e-05, "loss": 0.0085, "step": 127270 }, { "epoch": 1.38, "learning_rate": 9.360446260621391e-05, "loss": 0.0103, "step": 127280 }, { "epoch": 1.38, "learning_rate": 9.3588246740611e-05, "loss": 0.0059, "step": 127290 }, { "epoch": 1.38, "learning_rate": 9.35720308750081e-05, "loss": 0.01, "step": 127300 }, { "epoch": 1.38, "learning_rate": 9.35558150094052e-05, "loss": 0.0083, "step": 127310 }, { "epoch": 1.38, "learning_rate": 9.353959914380229e-05, "loss": 0.0104, "step": 127320 }, { "epoch": 1.38, "learning_rate": 9.352338327819939e-05, "loss": 0.0096, "step": 127330 }, { "epoch": 1.38, "learning_rate": 9.350716741259648e-05, "loss": 0.0074, "step": 127340 }, { "epoch": 1.38, "learning_rate": 9.349095154699357e-05, "loss": 0.0088, "step": 127350 }, { "epoch": 1.38, "learning_rate": 9.347473568139068e-05, "loss": 0.007, "step": 127360 }, { "epoch": 1.38, "learning_rate": 9.345851981578776e-05, "loss": 0.0088, "step": 127370 }, { "epoch": 1.38, "learning_rate": 9.344230395018486e-05, "loss": 0.0095, "step": 127380 }, { "epoch": 1.38, "learning_rate": 9.342608808458194e-05, "loss": 0.0074, "step": 127390 }, { "epoch": 1.38, "learning_rate": 9.340987221897905e-05, "loss": 0.0088, "step": 127400 }, { "epoch": 1.38, "learning_rate": 9.339365635337613e-05, "loss": 0.0096, "step": 127410 }, { "epoch": 1.38, "learning_rate": 9.337744048777323e-05, "loss": 0.0082, "step": 127420 }, { "epoch": 1.38, "learning_rate": 9.336122462217033e-05, "loss": 0.0072, "step": 127430 }, { "epoch": 1.38, "learning_rate": 9.334500875656742e-05, "loss": 0.0072, "step": 127440 }, { "epoch": 1.38, "learning_rate": 9.332879289096451e-05, "loss": 0.0074, "step": 127450 }, { "epoch": 1.38, "learning_rate": 9.331257702536162e-05, "loss": 0.0064, "step": 127460 }, { "epoch": 1.38, "learning_rate": 9.32963611597587e-05, "loss": 0.0113, "step": 127470 }, { "epoch": 1.38, "learning_rate": 9.32801452941558e-05, "loss": 0.0081, "step": 127480 }, { "epoch": 1.38, "learning_rate": 9.326392942855288e-05, "loss": 0.0072, "step": 127490 }, { "epoch": 1.38, "learning_rate": 9.324771356294999e-05, "loss": 0.0075, "step": 127500 }, { "epoch": 1.38, "learning_rate": 9.323149769734707e-05, "loss": 0.0072, "step": 127510 }, { "epoch": 1.38, "learning_rate": 9.321528183174418e-05, "loss": 0.0083, "step": 127520 }, { "epoch": 1.38, "learning_rate": 9.319906596614127e-05, "loss": 0.0088, "step": 127530 }, { "epoch": 1.38, "learning_rate": 9.318285010053836e-05, "loss": 0.0076, "step": 127540 }, { "epoch": 1.38, "learning_rate": 9.316663423493545e-05, "loss": 0.0089, "step": 127550 }, { "epoch": 1.38, "learning_rate": 9.315041836933255e-05, "loss": 0.0096, "step": 127560 }, { "epoch": 1.38, "learning_rate": 9.313420250372964e-05, "loss": 0.0089, "step": 127570 }, { "epoch": 1.38, "learning_rate": 9.311798663812675e-05, "loss": 0.0063, "step": 127580 }, { "epoch": 1.38, "learning_rate": 9.310177077252382e-05, "loss": 0.0094, "step": 127590 }, { "epoch": 1.38, "learning_rate": 9.308555490692093e-05, "loss": 0.0092, "step": 127600 }, { "epoch": 1.38, "learning_rate": 9.306933904131801e-05, "loss": 0.0101, "step": 127610 }, { "epoch": 1.38, "learning_rate": 9.305312317571512e-05, "loss": 0.01, "step": 127620 }, { "epoch": 1.38, "learning_rate": 9.30369073101122e-05, "loss": 0.0081, "step": 127630 }, { "epoch": 1.38, "learning_rate": 9.30206914445093e-05, "loss": 0.0096, "step": 127640 }, { "epoch": 1.38, "learning_rate": 9.30044755789064e-05, "loss": 0.0078, "step": 127650 }, { "epoch": 1.38, "learning_rate": 9.298825971330349e-05, "loss": 0.0144, "step": 127660 }, { "epoch": 1.38, "learning_rate": 9.297204384770058e-05, "loss": 0.009, "step": 127670 }, { "epoch": 1.38, "learning_rate": 9.295582798209769e-05, "loss": 0.008, "step": 127680 }, { "epoch": 1.38, "learning_rate": 9.293961211649477e-05, "loss": 0.0072, "step": 127690 }, { "epoch": 1.38, "learning_rate": 9.292339625089187e-05, "loss": 0.0077, "step": 127700 }, { "epoch": 1.38, "learning_rate": 9.290718038528895e-05, "loss": 0.0089, "step": 127710 }, { "epoch": 1.38, "learning_rate": 9.289096451968606e-05, "loss": 0.0096, "step": 127720 }, { "epoch": 1.38, "learning_rate": 9.287474865408314e-05, "loss": 0.0093, "step": 127730 }, { "epoch": 1.38, "learning_rate": 9.285853278848024e-05, "loss": 0.007, "step": 127740 }, { "epoch": 1.38, "learning_rate": 9.284231692287734e-05, "loss": 0.0101, "step": 127750 }, { "epoch": 1.38, "learning_rate": 9.282610105727443e-05, "loss": 0.0074, "step": 127760 }, { "epoch": 1.38, "learning_rate": 9.280988519167152e-05, "loss": 0.0094, "step": 127770 }, { "epoch": 1.38, "learning_rate": 9.279366932606863e-05, "loss": 0.015, "step": 127780 }, { "epoch": 1.38, "learning_rate": 9.27774534604657e-05, "loss": 0.0079, "step": 127790 }, { "epoch": 1.38, "learning_rate": 9.276123759486281e-05, "loss": 0.0072, "step": 127800 }, { "epoch": 1.38, "learning_rate": 9.274502172925989e-05, "loss": 0.0075, "step": 127810 }, { "epoch": 1.38, "learning_rate": 9.2728805863657e-05, "loss": 0.0098, "step": 127820 }, { "epoch": 1.38, "learning_rate": 9.271258999805408e-05, "loss": 0.0063, "step": 127830 }, { "epoch": 1.38, "learning_rate": 9.269637413245118e-05, "loss": 0.0076, "step": 127840 }, { "epoch": 1.38, "learning_rate": 9.268015826684828e-05, "loss": 0.0086, "step": 127850 }, { "epoch": 1.38, "learning_rate": 9.266394240124537e-05, "loss": 0.0081, "step": 127860 }, { "epoch": 1.38, "learning_rate": 9.264772653564246e-05, "loss": 0.009, "step": 127870 }, { "epoch": 1.38, "learning_rate": 9.263151067003955e-05, "loss": 0.0089, "step": 127880 }, { "epoch": 1.38, "learning_rate": 9.261529480443665e-05, "loss": 0.0107, "step": 127890 }, { "epoch": 1.38, "learning_rate": 9.259907893883375e-05, "loss": 0.0085, "step": 127900 }, { "epoch": 1.38, "learning_rate": 9.258286307323083e-05, "loss": 0.0091, "step": 127910 }, { "epoch": 1.38, "learning_rate": 9.256664720762794e-05, "loss": 0.0074, "step": 127920 }, { "epoch": 1.38, "learning_rate": 9.255043134202502e-05, "loss": 0.0083, "step": 127930 }, { "epoch": 1.38, "learning_rate": 9.253421547642212e-05, "loss": 0.0072, "step": 127940 }, { "epoch": 1.38, "learning_rate": 9.25179996108192e-05, "loss": 0.009, "step": 127950 }, { "epoch": 1.38, "learning_rate": 9.250178374521631e-05, "loss": 0.0074, "step": 127960 }, { "epoch": 1.38, "learning_rate": 9.24855678796134e-05, "loss": 0.0101, "step": 127970 }, { "epoch": 1.38, "learning_rate": 9.24693520140105e-05, "loss": 0.0096, "step": 127980 }, { "epoch": 1.38, "learning_rate": 9.245313614840759e-05, "loss": 0.0076, "step": 127990 }, { "epoch": 1.38, "learning_rate": 9.24369202828047e-05, "loss": 0.0063, "step": 128000 }, { "epoch": 1.38, "eval_cer": 0.9215738390687187, "eval_loss": 0.007414136081933975, "eval_runtime": 121.0821, "eval_samples_per_second": 16.518, "eval_steps_per_second": 4.129, "step": 128000 }, { "epoch": 1.38, "learning_rate": 9.242070441720177e-05, "loss": 0.0089, "step": 128010 }, { "epoch": 1.38, "learning_rate": 9.240448855159888e-05, "loss": 0.0094, "step": 128020 }, { "epoch": 1.38, "learning_rate": 9.238827268599596e-05, "loss": 0.0079, "step": 128030 }, { "epoch": 1.38, "learning_rate": 9.237205682039307e-05, "loss": 0.0095, "step": 128040 }, { "epoch": 1.38, "learning_rate": 9.235584095479017e-05, "loss": 0.0091, "step": 128050 }, { "epoch": 1.38, "learning_rate": 9.233962508918725e-05, "loss": 0.0102, "step": 128060 }, { "epoch": 1.38, "learning_rate": 9.232340922358436e-05, "loss": 0.0086, "step": 128070 }, { "epoch": 1.38, "learning_rate": 9.230719335798144e-05, "loss": 0.0095, "step": 128080 }, { "epoch": 1.38, "learning_rate": 9.229097749237854e-05, "loss": 0.0081, "step": 128090 }, { "epoch": 1.38, "learning_rate": 9.227476162677562e-05, "loss": 0.0107, "step": 128100 }, { "epoch": 1.38, "learning_rate": 9.225854576117273e-05, "loss": 0.01, "step": 128110 }, { "epoch": 1.39, "learning_rate": 9.224232989556982e-05, "loss": 0.0076, "step": 128120 }, { "epoch": 1.39, "learning_rate": 9.222611402996691e-05, "loss": 0.0086, "step": 128130 }, { "epoch": 1.39, "learning_rate": 9.2209898164364e-05, "loss": 0.0089, "step": 128140 }, { "epoch": 1.39, "learning_rate": 9.219368229876111e-05, "loss": 0.0096, "step": 128150 }, { "epoch": 1.39, "learning_rate": 9.217746643315819e-05, "loss": 0.0081, "step": 128160 }, { "epoch": 1.39, "learning_rate": 9.21612505675553e-05, "loss": 0.0089, "step": 128170 }, { "epoch": 1.39, "learning_rate": 9.214503470195238e-05, "loss": 0.008, "step": 128180 }, { "epoch": 1.39, "learning_rate": 9.212881883634948e-05, "loss": 0.0079, "step": 128190 }, { "epoch": 1.39, "learning_rate": 9.211260297074656e-05, "loss": 0.0084, "step": 128200 }, { "epoch": 1.39, "learning_rate": 9.209638710514367e-05, "loss": 0.0127, "step": 128210 }, { "epoch": 1.39, "learning_rate": 9.208017123954076e-05, "loss": 0.0084, "step": 128220 }, { "epoch": 1.39, "learning_rate": 9.206395537393785e-05, "loss": 0.0064, "step": 128230 }, { "epoch": 1.39, "learning_rate": 9.204773950833495e-05, "loss": 0.0077, "step": 128240 }, { "epoch": 1.39, "learning_rate": 9.203152364273204e-05, "loss": 0.0083, "step": 128250 }, { "epoch": 1.39, "learning_rate": 9.201530777712913e-05, "loss": 0.0083, "step": 128260 }, { "epoch": 1.39, "learning_rate": 9.199909191152624e-05, "loss": 0.0068, "step": 128270 }, { "epoch": 1.39, "learning_rate": 9.198287604592332e-05, "loss": 0.0063, "step": 128280 }, { "epoch": 1.39, "learning_rate": 9.196666018032042e-05, "loss": 0.008, "step": 128290 }, { "epoch": 1.39, "learning_rate": 9.19504443147175e-05, "loss": 0.0098, "step": 128300 }, { "epoch": 1.39, "learning_rate": 9.193422844911461e-05, "loss": 0.0083, "step": 128310 }, { "epoch": 1.39, "learning_rate": 9.19180125835117e-05, "loss": 0.0093, "step": 128320 }, { "epoch": 1.39, "learning_rate": 9.19017967179088e-05, "loss": 0.0088, "step": 128330 }, { "epoch": 1.39, "learning_rate": 9.188558085230589e-05, "loss": 0.0091, "step": 128340 }, { "epoch": 1.39, "learning_rate": 9.186936498670298e-05, "loss": 0.0074, "step": 128350 }, { "epoch": 1.39, "learning_rate": 9.185314912110007e-05, "loss": 0.0074, "step": 128360 }, { "epoch": 1.39, "learning_rate": 9.183693325549718e-05, "loss": 0.0102, "step": 128370 }, { "epoch": 1.39, "learning_rate": 9.182071738989426e-05, "loss": 0.0076, "step": 128380 }, { "epoch": 1.39, "learning_rate": 9.180450152429137e-05, "loss": 0.0091, "step": 128390 }, { "epoch": 1.39, "learning_rate": 9.178828565868844e-05, "loss": 0.0143, "step": 128400 }, { "epoch": 1.39, "learning_rate": 9.177206979308555e-05, "loss": 0.0101, "step": 128410 }, { "epoch": 1.39, "learning_rate": 9.175585392748263e-05, "loss": 0.0108, "step": 128420 }, { "epoch": 1.39, "learning_rate": 9.173963806187974e-05, "loss": 0.0083, "step": 128430 }, { "epoch": 1.39, "learning_rate": 9.172342219627683e-05, "loss": 0.0088, "step": 128440 }, { "epoch": 1.39, "learning_rate": 9.170720633067392e-05, "loss": 0.008, "step": 128450 }, { "epoch": 1.39, "learning_rate": 9.169099046507102e-05, "loss": 0.0067, "step": 128460 }, { "epoch": 1.39, "learning_rate": 9.167477459946812e-05, "loss": 0.0089, "step": 128470 }, { "epoch": 1.39, "learning_rate": 9.16585587338652e-05, "loss": 0.0112, "step": 128480 }, { "epoch": 1.39, "learning_rate": 9.164234286826231e-05, "loss": 0.0071, "step": 128490 }, { "epoch": 1.39, "learning_rate": 9.162612700265939e-05, "loss": 0.0112, "step": 128500 }, { "epoch": 1.39, "learning_rate": 9.160991113705649e-05, "loss": 0.0094, "step": 128510 }, { "epoch": 1.39, "learning_rate": 9.159369527145357e-05, "loss": 0.0087, "step": 128520 }, { "epoch": 1.39, "learning_rate": 9.157747940585068e-05, "loss": 0.0072, "step": 128530 }, { "epoch": 1.39, "learning_rate": 9.156126354024777e-05, "loss": 0.0095, "step": 128540 }, { "epoch": 1.39, "learning_rate": 9.154504767464486e-05, "loss": 0.0095, "step": 128550 }, { "epoch": 1.39, "learning_rate": 9.152883180904196e-05, "loss": 0.0076, "step": 128560 }, { "epoch": 1.39, "learning_rate": 9.151261594343905e-05, "loss": 0.0088, "step": 128570 }, { "epoch": 1.39, "learning_rate": 9.149640007783614e-05, "loss": 0.008, "step": 128580 }, { "epoch": 1.39, "learning_rate": 9.148018421223325e-05, "loss": 0.0097, "step": 128590 }, { "epoch": 1.39, "learning_rate": 9.146396834663033e-05, "loss": 0.0077, "step": 128600 }, { "epoch": 1.39, "learning_rate": 9.144775248102743e-05, "loss": 0.0115, "step": 128610 }, { "epoch": 1.39, "learning_rate": 9.143153661542451e-05, "loss": 0.0102, "step": 128620 }, { "epoch": 1.39, "learning_rate": 9.141532074982162e-05, "loss": 0.0089, "step": 128630 }, { "epoch": 1.39, "learning_rate": 9.13991048842187e-05, "loss": 0.0083, "step": 128640 }, { "epoch": 1.39, "learning_rate": 9.13828890186158e-05, "loss": 0.0082, "step": 128650 }, { "epoch": 1.39, "learning_rate": 9.13666731530129e-05, "loss": 0.0099, "step": 128660 }, { "epoch": 1.39, "learning_rate": 9.135045728740999e-05, "loss": 0.0095, "step": 128670 }, { "epoch": 1.39, "learning_rate": 9.133424142180708e-05, "loss": 0.0081, "step": 128680 }, { "epoch": 1.39, "learning_rate": 9.131802555620419e-05, "loss": 0.0095, "step": 128690 }, { "epoch": 1.39, "learning_rate": 9.130180969060127e-05, "loss": 0.0082, "step": 128700 }, { "epoch": 1.39, "learning_rate": 9.128559382499837e-05, "loss": 0.0081, "step": 128710 }, { "epoch": 1.39, "learning_rate": 9.126937795939545e-05, "loss": 0.0078, "step": 128720 }, { "epoch": 1.39, "learning_rate": 9.125316209379256e-05, "loss": 0.0087, "step": 128730 }, { "epoch": 1.39, "learning_rate": 9.123694622818964e-05, "loss": 0.0074, "step": 128740 }, { "epoch": 1.39, "learning_rate": 9.122073036258675e-05, "loss": 0.0092, "step": 128750 }, { "epoch": 1.39, "learning_rate": 9.120451449698385e-05, "loss": 0.0081, "step": 128760 }, { "epoch": 1.39, "learning_rate": 9.118829863138093e-05, "loss": 0.0087, "step": 128770 }, { "epoch": 1.39, "learning_rate": 9.117208276577804e-05, "loss": 0.0081, "step": 128780 }, { "epoch": 1.39, "learning_rate": 9.115586690017512e-05, "loss": 0.0068, "step": 128790 }, { "epoch": 1.39, "learning_rate": 9.113965103457222e-05, "loss": 0.0084, "step": 128800 }, { "epoch": 1.39, "learning_rate": 9.112343516896932e-05, "loss": 0.0071, "step": 128810 }, { "epoch": 1.39, "learning_rate": 9.110721930336641e-05, "loss": 0.0076, "step": 128820 }, { "epoch": 1.39, "learning_rate": 9.10910034377635e-05, "loss": 0.0087, "step": 128830 }, { "epoch": 1.39, "learning_rate": 9.107478757216061e-05, "loss": 0.0092, "step": 128840 }, { "epoch": 1.39, "learning_rate": 9.105857170655769e-05, "loss": 0.009, "step": 128850 }, { "epoch": 1.39, "learning_rate": 9.104235584095479e-05, "loss": 0.0071, "step": 128860 }, { "epoch": 1.39, "learning_rate": 9.102613997535187e-05, "loss": 0.0079, "step": 128870 }, { "epoch": 1.39, "learning_rate": 9.100992410974898e-05, "loss": 0.008, "step": 128880 }, { "epoch": 1.39, "learning_rate": 9.099370824414606e-05, "loss": 0.0083, "step": 128890 }, { "epoch": 1.39, "learning_rate": 9.097749237854316e-05, "loss": 0.0076, "step": 128900 }, { "epoch": 1.39, "learning_rate": 9.096127651294026e-05, "loss": 0.009, "step": 128910 }, { "epoch": 1.39, "learning_rate": 9.094506064733735e-05, "loss": 0.0104, "step": 128920 }, { "epoch": 1.39, "learning_rate": 9.092884478173444e-05, "loss": 0.0072, "step": 128930 }, { "epoch": 1.39, "learning_rate": 9.091262891613155e-05, "loss": 0.0073, "step": 128940 }, { "epoch": 1.39, "learning_rate": 9.089641305052863e-05, "loss": 0.008, "step": 128950 }, { "epoch": 1.39, "learning_rate": 9.088019718492573e-05, "loss": 0.0083, "step": 128960 }, { "epoch": 1.39, "learning_rate": 9.086398131932281e-05, "loss": 0.0069, "step": 128970 }, { "epoch": 1.39, "learning_rate": 9.084776545371992e-05, "loss": 0.009, "step": 128980 }, { "epoch": 1.39, "learning_rate": 9.0831549588117e-05, "loss": 0.0088, "step": 128990 }, { "epoch": 1.39, "learning_rate": 9.08153337225141e-05, "loss": 0.0084, "step": 129000 }, { "epoch": 1.39, "eval_cer": 0.9215460437741146, "eval_loss": 0.0069303130730986595, "eval_runtime": 121.2397, "eval_samples_per_second": 16.496, "eval_steps_per_second": 4.124, "step": 129000 }, { "epoch": 1.39, "learning_rate": 9.07991178569112e-05, "loss": 0.0092, "step": 129010 }, { "epoch": 1.39, "learning_rate": 9.078290199130829e-05, "loss": 0.0114, "step": 129020 }, { "epoch": 1.39, "learning_rate": 9.076668612570538e-05, "loss": 0.0079, "step": 129030 }, { "epoch": 1.39, "learning_rate": 9.075047026010248e-05, "loss": 0.0062, "step": 129040 }, { "epoch": 1.4, "learning_rate": 9.073425439449957e-05, "loss": 0.0069, "step": 129050 }, { "epoch": 1.4, "learning_rate": 9.071803852889667e-05, "loss": 0.0105, "step": 129060 }, { "epoch": 1.4, "learning_rate": 9.070182266329375e-05, "loss": 0.0091, "step": 129070 }, { "epoch": 1.4, "learning_rate": 9.068560679769086e-05, "loss": 0.0091, "step": 129080 }, { "epoch": 1.4, "learning_rate": 9.066939093208794e-05, "loss": 0.0102, "step": 129090 }, { "epoch": 1.4, "learning_rate": 9.065317506648505e-05, "loss": 0.0086, "step": 129100 }, { "epoch": 1.4, "learning_rate": 9.063695920088212e-05, "loss": 0.0098, "step": 129110 }, { "epoch": 1.4, "learning_rate": 9.062074333527923e-05, "loss": 0.0091, "step": 129120 }, { "epoch": 1.4, "learning_rate": 9.060452746967632e-05, "loss": 0.0096, "step": 129130 }, { "epoch": 1.4, "learning_rate": 9.058831160407342e-05, "loss": 0.0071, "step": 129140 }, { "epoch": 1.4, "learning_rate": 9.057209573847051e-05, "loss": 0.0099, "step": 129150 }, { "epoch": 1.4, "learning_rate": 9.055587987286762e-05, "loss": 0.0074, "step": 129160 }, { "epoch": 1.4, "learning_rate": 9.05396640072647e-05, "loss": 0.0095, "step": 129170 }, { "epoch": 1.4, "learning_rate": 9.05234481416618e-05, "loss": 0.0089, "step": 129180 }, { "epoch": 1.4, "learning_rate": 9.050723227605888e-05, "loss": 0.008, "step": 129190 }, { "epoch": 1.4, "learning_rate": 9.049101641045599e-05, "loss": 0.009, "step": 129200 }, { "epoch": 1.4, "learning_rate": 9.047480054485307e-05, "loss": 0.0079, "step": 129210 }, { "epoch": 1.4, "learning_rate": 9.045858467925017e-05, "loss": 0.0083, "step": 129220 }, { "epoch": 1.4, "learning_rate": 9.044236881364726e-05, "loss": 0.0075, "step": 129230 }, { "epoch": 1.4, "learning_rate": 9.042615294804436e-05, "loss": 0.0073, "step": 129240 }, { "epoch": 1.4, "learning_rate": 9.040993708244145e-05, "loss": 0.0083, "step": 129250 }, { "epoch": 1.4, "learning_rate": 9.039372121683854e-05, "loss": 0.009, "step": 129260 }, { "epoch": 1.4, "learning_rate": 9.037750535123564e-05, "loss": 0.0089, "step": 129270 }, { "epoch": 1.4, "learning_rate": 9.036128948563274e-05, "loss": 0.0087, "step": 129280 }, { "epoch": 1.4, "learning_rate": 9.034507362002982e-05, "loss": 0.0077, "step": 129290 }, { "epoch": 1.4, "learning_rate": 9.032885775442693e-05, "loss": 0.0074, "step": 129300 }, { "epoch": 1.4, "learning_rate": 9.0312641888824e-05, "loss": 0.0088, "step": 129310 }, { "epoch": 1.4, "learning_rate": 9.029642602322111e-05, "loss": 0.0079, "step": 129320 }, { "epoch": 1.4, "learning_rate": 9.02802101576182e-05, "loss": 0.0068, "step": 129330 }, { "epoch": 1.4, "learning_rate": 9.02639942920153e-05, "loss": 0.0093, "step": 129340 }, { "epoch": 1.4, "learning_rate": 9.024777842641239e-05, "loss": 0.0054, "step": 129350 }, { "epoch": 1.4, "learning_rate": 9.023156256080948e-05, "loss": 0.008, "step": 129360 }, { "epoch": 1.4, "learning_rate": 9.021534669520658e-05, "loss": 0.0073, "step": 129370 }, { "epoch": 1.4, "learning_rate": 9.019913082960368e-05, "loss": 0.0097, "step": 129380 }, { "epoch": 1.4, "learning_rate": 9.018291496400076e-05, "loss": 0.0081, "step": 129390 }, { "epoch": 1.4, "learning_rate": 9.016669909839787e-05, "loss": 0.0061, "step": 129400 }, { "epoch": 1.4, "learning_rate": 9.015048323279495e-05, "loss": 0.0078, "step": 129410 }, { "epoch": 1.4, "learning_rate": 9.013426736719205e-05, "loss": 0.0069, "step": 129420 }, { "epoch": 1.4, "learning_rate": 9.011805150158913e-05, "loss": 0.0072, "step": 129430 }, { "epoch": 1.4, "learning_rate": 9.010183563598624e-05, "loss": 0.0082, "step": 129440 }, { "epoch": 1.4, "learning_rate": 9.008561977038333e-05, "loss": 0.009, "step": 129450 }, { "epoch": 1.4, "learning_rate": 9.006940390478042e-05, "loss": 0.0061, "step": 129460 }, { "epoch": 1.4, "learning_rate": 9.005318803917752e-05, "loss": 0.0085, "step": 129470 }, { "epoch": 1.4, "learning_rate": 9.003697217357462e-05, "loss": 0.0067, "step": 129480 }, { "epoch": 1.4, "learning_rate": 9.002075630797172e-05, "loss": 0.0077, "step": 129490 }, { "epoch": 1.4, "learning_rate": 9.000454044236881e-05, "loss": 0.0095, "step": 129500 }, { "epoch": 1.4, "learning_rate": 8.99883245767659e-05, "loss": 0.0094, "step": 129510 }, { "epoch": 1.4, "learning_rate": 8.9972108711163e-05, "loss": 0.0076, "step": 129520 }, { "epoch": 1.4, "learning_rate": 8.99558928455601e-05, "loss": 0.0086, "step": 129530 }, { "epoch": 1.4, "learning_rate": 8.993967697995718e-05, "loss": 0.0084, "step": 129540 }, { "epoch": 1.4, "learning_rate": 8.992346111435429e-05, "loss": 0.0064, "step": 129550 }, { "epoch": 1.4, "learning_rate": 8.990724524875137e-05, "loss": 0.0095, "step": 129560 }, { "epoch": 1.4, "learning_rate": 8.989102938314847e-05, "loss": 0.0085, "step": 129570 }, { "epoch": 1.4, "learning_rate": 8.987481351754555e-05, "loss": 0.0087, "step": 129580 }, { "epoch": 1.4, "learning_rate": 8.985859765194266e-05, "loss": 0.0073, "step": 129590 }, { "epoch": 1.4, "learning_rate": 8.984238178633975e-05, "loss": 0.0101, "step": 129600 }, { "epoch": 1.4, "learning_rate": 8.982616592073684e-05, "loss": 0.0082, "step": 129610 }, { "epoch": 1.4, "learning_rate": 8.980995005513394e-05, "loss": 0.0096, "step": 129620 }, { "epoch": 1.4, "learning_rate": 8.979373418953104e-05, "loss": 0.0087, "step": 129630 }, { "epoch": 1.4, "learning_rate": 8.977751832392812e-05, "loss": 0.0081, "step": 129640 }, { "epoch": 1.4, "learning_rate": 8.976130245832523e-05, "loss": 0.0107, "step": 129650 }, { "epoch": 1.4, "learning_rate": 8.974508659272231e-05, "loss": 0.0091, "step": 129660 }, { "epoch": 1.4, "learning_rate": 8.972887072711941e-05, "loss": 0.0065, "step": 129670 }, { "epoch": 1.4, "learning_rate": 8.971265486151649e-05, "loss": 0.0075, "step": 129680 }, { "epoch": 1.4, "learning_rate": 8.96964389959136e-05, "loss": 0.0075, "step": 129690 }, { "epoch": 1.4, "learning_rate": 8.968022313031069e-05, "loss": 0.0098, "step": 129700 }, { "epoch": 1.4, "learning_rate": 8.966400726470778e-05, "loss": 0.0084, "step": 129710 }, { "epoch": 1.4, "learning_rate": 8.964779139910488e-05, "loss": 0.0107, "step": 129720 }, { "epoch": 1.4, "learning_rate": 8.963157553350197e-05, "loss": 0.0099, "step": 129730 }, { "epoch": 1.4, "learning_rate": 8.961535966789906e-05, "loss": 0.0087, "step": 129740 }, { "epoch": 1.4, "learning_rate": 8.959914380229617e-05, "loss": 0.0075, "step": 129750 }, { "epoch": 1.4, "learning_rate": 8.958292793669325e-05, "loss": 0.0077, "step": 129760 }, { "epoch": 1.4, "learning_rate": 8.956671207109035e-05, "loss": 0.0089, "step": 129770 }, { "epoch": 1.4, "learning_rate": 8.955049620548743e-05, "loss": 0.0104, "step": 129780 }, { "epoch": 1.4, "learning_rate": 8.953428033988454e-05, "loss": 0.0125, "step": 129790 }, { "epoch": 1.4, "learning_rate": 8.951806447428162e-05, "loss": 0.0079, "step": 129800 }, { "epoch": 1.4, "learning_rate": 8.950184860867873e-05, "loss": 0.0098, "step": 129810 }, { "epoch": 1.4, "learning_rate": 8.948563274307582e-05, "loss": 0.0077, "step": 129820 }, { "epoch": 1.4, "learning_rate": 8.946941687747291e-05, "loss": 0.0093, "step": 129830 }, { "epoch": 1.4, "learning_rate": 8.945320101187e-05, "loss": 0.0082, "step": 129840 }, { "epoch": 1.4, "learning_rate": 8.943698514626711e-05, "loss": 0.0085, "step": 129850 }, { "epoch": 1.4, "learning_rate": 8.942076928066419e-05, "loss": 0.0107, "step": 129860 }, { "epoch": 1.4, "learning_rate": 8.94045534150613e-05, "loss": 0.009, "step": 129870 }, { "epoch": 1.4, "learning_rate": 8.938833754945837e-05, "loss": 0.0063, "step": 129880 }, { "epoch": 1.4, "learning_rate": 8.937212168385548e-05, "loss": 0.0093, "step": 129890 }, { "epoch": 1.4, "learning_rate": 8.935590581825256e-05, "loss": 0.0084, "step": 129900 }, { "epoch": 1.4, "learning_rate": 8.933968995264967e-05, "loss": 0.0072, "step": 129910 }, { "epoch": 1.4, "learning_rate": 8.932347408704676e-05, "loss": 0.0078, "step": 129920 }, { "epoch": 1.4, "learning_rate": 8.930725822144385e-05, "loss": 0.008, "step": 129930 }, { "epoch": 1.4, "learning_rate": 8.929104235584094e-05, "loss": 0.007, "step": 129940 }, { "epoch": 1.4, "learning_rate": 8.927482649023805e-05, "loss": 0.0082, "step": 129950 }, { "epoch": 1.4, "learning_rate": 8.925861062463513e-05, "loss": 0.0094, "step": 129960 }, { "epoch": 1.41, "learning_rate": 8.924239475903224e-05, "loss": 0.0065, "step": 129970 }, { "epoch": 1.41, "learning_rate": 8.922617889342932e-05, "loss": 0.0075, "step": 129980 }, { "epoch": 1.41, "learning_rate": 8.920996302782642e-05, "loss": 0.0081, "step": 129990 }, { "epoch": 1.41, "learning_rate": 8.91937471622235e-05, "loss": 0.0085, "step": 130000 }, { "epoch": 1.41, "eval_cer": 0.9215477809800273, "eval_loss": 0.00709355715662241, "eval_runtime": 121.4935, "eval_samples_per_second": 16.462, "eval_steps_per_second": 4.115, "step": 130000 }, { "epoch": 1.41, "learning_rate": 8.917753129662061e-05, "loss": 0.0091, "step": 130010 }, { "epoch": 1.41, "learning_rate": 8.91613154310177e-05, "loss": 0.0071, "step": 130020 }, { "epoch": 1.41, "learning_rate": 8.914509956541479e-05, "loss": 0.0094, "step": 130030 }, { "epoch": 1.41, "learning_rate": 8.912888369981189e-05, "loss": 0.0084, "step": 130040 }, { "epoch": 1.41, "learning_rate": 8.911266783420898e-05, "loss": 0.01, "step": 130050 }, { "epoch": 1.41, "learning_rate": 8.909645196860607e-05, "loss": 0.0062, "step": 130060 }, { "epoch": 1.41, "learning_rate": 8.908023610300318e-05, "loss": 0.0074, "step": 130070 }, { "epoch": 1.41, "learning_rate": 8.906402023740026e-05, "loss": 0.0084, "step": 130080 }, { "epoch": 1.41, "learning_rate": 8.904780437179736e-05, "loss": 0.0077, "step": 130090 }, { "epoch": 1.41, "learning_rate": 8.903158850619444e-05, "loss": 0.0069, "step": 130100 }, { "epoch": 1.41, "learning_rate": 8.901537264059155e-05, "loss": 0.0106, "step": 130110 }, { "epoch": 1.41, "learning_rate": 8.899915677498863e-05, "loss": 0.0089, "step": 130120 }, { "epoch": 1.41, "learning_rate": 8.898294090938573e-05, "loss": 0.0076, "step": 130130 }, { "epoch": 1.41, "learning_rate": 8.896672504378283e-05, "loss": 0.0072, "step": 130140 }, { "epoch": 1.41, "learning_rate": 8.895050917817992e-05, "loss": 0.007, "step": 130150 }, { "epoch": 1.41, "learning_rate": 8.893429331257701e-05, "loss": 0.0102, "step": 130160 }, { "epoch": 1.41, "learning_rate": 8.891807744697412e-05, "loss": 0.0082, "step": 130170 }, { "epoch": 1.41, "learning_rate": 8.89018615813712e-05, "loss": 0.0064, "step": 130180 }, { "epoch": 1.41, "learning_rate": 8.88856457157683e-05, "loss": 0.0098, "step": 130190 }, { "epoch": 1.41, "learning_rate": 8.88694298501654e-05, "loss": 0.0082, "step": 130200 }, { "epoch": 1.41, "learning_rate": 8.885321398456249e-05, "loss": 0.0123, "step": 130210 }, { "epoch": 1.41, "learning_rate": 8.88369981189596e-05, "loss": 0.008, "step": 130220 }, { "epoch": 1.41, "learning_rate": 8.882078225335667e-05, "loss": 0.0114, "step": 130230 }, { "epoch": 1.41, "learning_rate": 8.880456638775378e-05, "loss": 0.0089, "step": 130240 }, { "epoch": 1.41, "learning_rate": 8.878835052215086e-05, "loss": 0.0083, "step": 130250 }, { "epoch": 1.41, "learning_rate": 8.877213465654797e-05, "loss": 0.0099, "step": 130260 }, { "epoch": 1.41, "learning_rate": 8.875591879094505e-05, "loss": 0.0069, "step": 130270 }, { "epoch": 1.41, "learning_rate": 8.873970292534215e-05, "loss": 0.0062, "step": 130280 }, { "epoch": 1.41, "learning_rate": 8.872348705973924e-05, "loss": 0.0085, "step": 130290 }, { "epoch": 1.41, "learning_rate": 8.870727119413634e-05, "loss": 0.0091, "step": 130300 }, { "epoch": 1.41, "learning_rate": 8.869105532853343e-05, "loss": 0.0124, "step": 130310 }, { "epoch": 1.41, "learning_rate": 8.867483946293054e-05, "loss": 0.0075, "step": 130320 }, { "epoch": 1.41, "learning_rate": 8.865862359732762e-05, "loss": 0.0082, "step": 130330 }, { "epoch": 1.41, "learning_rate": 8.864240773172472e-05, "loss": 0.008, "step": 130340 }, { "epoch": 1.41, "learning_rate": 8.86261918661218e-05, "loss": 0.0089, "step": 130350 }, { "epoch": 1.41, "learning_rate": 8.860997600051891e-05, "loss": 0.0095, "step": 130360 }, { "epoch": 1.41, "learning_rate": 8.859376013491599e-05, "loss": 0.012, "step": 130370 }, { "epoch": 1.41, "learning_rate": 8.857754426931309e-05, "loss": 0.0072, "step": 130380 }, { "epoch": 1.41, "learning_rate": 8.856132840371019e-05, "loss": 0.0082, "step": 130390 }, { "epoch": 1.41, "learning_rate": 8.854511253810728e-05, "loss": 0.0085, "step": 130400 }, { "epoch": 1.41, "learning_rate": 8.852889667250437e-05, "loss": 0.0102, "step": 130410 }, { "epoch": 1.41, "learning_rate": 8.851268080690146e-05, "loss": 0.0081, "step": 130420 }, { "epoch": 1.41, "learning_rate": 8.849646494129856e-05, "loss": 0.0087, "step": 130430 }, { "epoch": 1.41, "learning_rate": 8.848024907569566e-05, "loss": 0.007, "step": 130440 }, { "epoch": 1.41, "learning_rate": 8.846403321009274e-05, "loss": 0.0087, "step": 130450 }, { "epoch": 1.41, "learning_rate": 8.844781734448985e-05, "loss": 0.0107, "step": 130460 }, { "epoch": 1.41, "learning_rate": 8.843160147888693e-05, "loss": 0.0101, "step": 130470 }, { "epoch": 1.41, "learning_rate": 8.841538561328403e-05, "loss": 0.0078, "step": 130480 }, { "epoch": 1.41, "learning_rate": 8.839916974768113e-05, "loss": 0.0086, "step": 130490 }, { "epoch": 1.41, "learning_rate": 8.838295388207822e-05, "loss": 0.0079, "step": 130500 }, { "epoch": 1.41, "learning_rate": 8.836673801647531e-05, "loss": 0.0069, "step": 130510 }, { "epoch": 1.41, "learning_rate": 8.83505221508724e-05, "loss": 0.0068, "step": 130520 }, { "epoch": 1.41, "learning_rate": 8.83343062852695e-05, "loss": 0.0078, "step": 130530 }, { "epoch": 1.41, "learning_rate": 8.83180904196666e-05, "loss": 0.0102, "step": 130540 }, { "epoch": 1.41, "learning_rate": 8.830187455406368e-05, "loss": 0.0108, "step": 130550 }, { "epoch": 1.41, "learning_rate": 8.828565868846079e-05, "loss": 0.0078, "step": 130560 }, { "epoch": 1.41, "learning_rate": 8.826944282285787e-05, "loss": 0.0093, "step": 130570 }, { "epoch": 1.41, "learning_rate": 8.825322695725497e-05, "loss": 0.0089, "step": 130580 }, { "epoch": 1.41, "learning_rate": 8.823701109165205e-05, "loss": 0.0084, "step": 130590 }, { "epoch": 1.41, "learning_rate": 8.822079522604916e-05, "loss": 0.0086, "step": 130600 }, { "epoch": 1.41, "learning_rate": 8.820457936044625e-05, "loss": 0.0113, "step": 130610 }, { "epoch": 1.41, "learning_rate": 8.818836349484335e-05, "loss": 0.008, "step": 130620 }, { "epoch": 1.41, "learning_rate": 8.817214762924044e-05, "loss": 0.0088, "step": 130630 }, { "epoch": 1.41, "learning_rate": 8.815593176363754e-05, "loss": 0.0088, "step": 130640 }, { "epoch": 1.41, "learning_rate": 8.813971589803462e-05, "loss": 0.0109, "step": 130650 }, { "epoch": 1.41, "learning_rate": 8.812350003243173e-05, "loss": 0.0092, "step": 130660 }, { "epoch": 1.41, "learning_rate": 8.810728416682881e-05, "loss": 0.008, "step": 130670 }, { "epoch": 1.41, "learning_rate": 8.809106830122592e-05, "loss": 0.0088, "step": 130680 }, { "epoch": 1.41, "learning_rate": 8.8074852435623e-05, "loss": 0.008, "step": 130690 }, { "epoch": 1.41, "learning_rate": 8.80586365700201e-05, "loss": 0.0066, "step": 130700 }, { "epoch": 1.41, "learning_rate": 8.80424207044172e-05, "loss": 0.0084, "step": 130710 }, { "epoch": 1.41, "learning_rate": 8.802620483881429e-05, "loss": 0.0095, "step": 130720 }, { "epoch": 1.41, "learning_rate": 8.800998897321138e-05, "loss": 0.0069, "step": 130730 }, { "epoch": 1.41, "learning_rate": 8.799377310760847e-05, "loss": 0.0063, "step": 130740 }, { "epoch": 1.41, "learning_rate": 8.797755724200556e-05, "loss": 0.0081, "step": 130750 }, { "epoch": 1.41, "learning_rate": 8.796134137640267e-05, "loss": 0.0089, "step": 130760 }, { "epoch": 1.41, "learning_rate": 8.794512551079975e-05, "loss": 0.0097, "step": 130770 }, { "epoch": 1.41, "learning_rate": 8.792890964519686e-05, "loss": 0.006, "step": 130780 }, { "epoch": 1.41, "learning_rate": 8.791269377959394e-05, "loss": 0.0092, "step": 130790 }, { "epoch": 1.41, "learning_rate": 8.789647791399104e-05, "loss": 0.0094, "step": 130800 }, { "epoch": 1.41, "learning_rate": 8.788026204838812e-05, "loss": 0.0094, "step": 130810 }, { "epoch": 1.41, "learning_rate": 8.786404618278523e-05, "loss": 0.0106, "step": 130820 }, { "epoch": 1.41, "learning_rate": 8.784783031718232e-05, "loss": 0.009, "step": 130830 }, { "epoch": 1.41, "learning_rate": 8.783161445157941e-05, "loss": 0.0082, "step": 130840 }, { "epoch": 1.41, "learning_rate": 8.78153985859765e-05, "loss": 0.007, "step": 130850 }, { "epoch": 1.41, "learning_rate": 8.779918272037361e-05, "loss": 0.0073, "step": 130860 }, { "epoch": 1.41, "learning_rate": 8.778296685477069e-05, "loss": 0.0079, "step": 130870 }, { "epoch": 1.41, "learning_rate": 8.77667509891678e-05, "loss": 0.0079, "step": 130880 }, { "epoch": 1.41, "learning_rate": 8.775053512356488e-05, "loss": 0.0069, "step": 130890 }, { "epoch": 1.42, "learning_rate": 8.773431925796198e-05, "loss": 0.0074, "step": 130900 }, { "epoch": 1.42, "learning_rate": 8.771810339235906e-05, "loss": 0.0086, "step": 130910 }, { "epoch": 1.42, "learning_rate": 8.770188752675617e-05, "loss": 0.0097, "step": 130920 }, { "epoch": 1.42, "learning_rate": 8.768567166115328e-05, "loss": 0.0093, "step": 130930 }, { "epoch": 1.42, "learning_rate": 8.766945579555035e-05, "loss": 0.008, "step": 130940 }, { "epoch": 1.42, "learning_rate": 8.765323992994746e-05, "loss": 0.0093, "step": 130950 }, { "epoch": 1.42, "learning_rate": 8.763702406434455e-05, "loss": 0.0078, "step": 130960 }, { "epoch": 1.42, "learning_rate": 8.762080819874165e-05, "loss": 0.0066, "step": 130970 }, { "epoch": 1.42, "learning_rate": 8.760459233313874e-05, "loss": 0.0082, "step": 130980 }, { "epoch": 1.42, "learning_rate": 8.758837646753583e-05, "loss": 0.0081, "step": 130990 }, { "epoch": 1.42, "learning_rate": 8.757216060193292e-05, "loss": 0.0107, "step": 131000 }, { "epoch": 1.42, "eval_cer": 0.9215486495829838, "eval_loss": 0.006674186792224646, "eval_runtime": 121.2703, "eval_samples_per_second": 16.492, "eval_steps_per_second": 4.123, "step": 131000 }, { "epoch": 1.42, "learning_rate": 8.755594473633003e-05, "loss": 0.013, "step": 131010 }, { "epoch": 1.42, "learning_rate": 8.753972887072711e-05, "loss": 0.0081, "step": 131020 }, { "epoch": 1.42, "learning_rate": 8.752351300512422e-05, "loss": 0.0114, "step": 131030 }, { "epoch": 1.42, "learning_rate": 8.75072971395213e-05, "loss": 0.0084, "step": 131040 }, { "epoch": 1.42, "learning_rate": 8.74910812739184e-05, "loss": 0.0119, "step": 131050 }, { "epoch": 1.42, "learning_rate": 8.747486540831548e-05, "loss": 0.0089, "step": 131060 }, { "epoch": 1.42, "learning_rate": 8.745864954271259e-05, "loss": 0.0105, "step": 131070 }, { "epoch": 1.42, "learning_rate": 8.744243367710968e-05, "loss": 0.0085, "step": 131080 }, { "epoch": 1.42, "learning_rate": 8.742621781150677e-05, "loss": 0.0078, "step": 131090 }, { "epoch": 1.42, "learning_rate": 8.741000194590387e-05, "loss": 0.0112, "step": 131100 }, { "epoch": 1.42, "learning_rate": 8.739378608030097e-05, "loss": 0.0083, "step": 131110 }, { "epoch": 1.42, "learning_rate": 8.737757021469805e-05, "loss": 0.0093, "step": 131120 }, { "epoch": 1.42, "learning_rate": 8.736135434909516e-05, "loss": 0.0079, "step": 131130 }, { "epoch": 1.42, "learning_rate": 8.734513848349224e-05, "loss": 0.0069, "step": 131140 }, { "epoch": 1.42, "learning_rate": 8.732892261788934e-05, "loss": 0.0067, "step": 131150 }, { "epoch": 1.42, "learning_rate": 8.731270675228642e-05, "loss": 0.0081, "step": 131160 }, { "epoch": 1.42, "learning_rate": 8.729649088668353e-05, "loss": 0.0074, "step": 131170 }, { "epoch": 1.42, "learning_rate": 8.728027502108062e-05, "loss": 0.0105, "step": 131180 }, { "epoch": 1.42, "learning_rate": 8.726405915547771e-05, "loss": 0.0089, "step": 131190 }, { "epoch": 1.42, "learning_rate": 8.72478432898748e-05, "loss": 0.008, "step": 131200 }, { "epoch": 1.42, "learning_rate": 8.72316274242719e-05, "loss": 0.0086, "step": 131210 }, { "epoch": 1.42, "learning_rate": 8.721541155866899e-05, "loss": 0.0063, "step": 131220 }, { "epoch": 1.42, "learning_rate": 8.71991956930661e-05, "loss": 0.0083, "step": 131230 }, { "epoch": 1.42, "learning_rate": 8.718297982746318e-05, "loss": 0.0104, "step": 131240 }, { "epoch": 1.42, "learning_rate": 8.716676396186028e-05, "loss": 0.0107, "step": 131250 }, { "epoch": 1.42, "learning_rate": 8.715054809625736e-05, "loss": 0.0082, "step": 131260 }, { "epoch": 1.42, "learning_rate": 8.713433223065447e-05, "loss": 0.0082, "step": 131270 }, { "epoch": 1.42, "learning_rate": 8.711811636505155e-05, "loss": 0.0068, "step": 131280 }, { "epoch": 1.42, "learning_rate": 8.710190049944865e-05, "loss": 0.007, "step": 131290 }, { "epoch": 1.42, "learning_rate": 8.708568463384575e-05, "loss": 0.0067, "step": 131300 }, { "epoch": 1.42, "learning_rate": 8.706946876824284e-05, "loss": 0.011, "step": 131310 }, { "epoch": 1.42, "learning_rate": 8.705325290263993e-05, "loss": 0.0088, "step": 131320 }, { "epoch": 1.42, "learning_rate": 8.703703703703704e-05, "loss": 0.0063, "step": 131330 }, { "epoch": 1.42, "learning_rate": 8.702082117143412e-05, "loss": 0.0077, "step": 131340 }, { "epoch": 1.42, "learning_rate": 8.700460530583122e-05, "loss": 0.007, "step": 131350 }, { "epoch": 1.42, "learning_rate": 8.69883894402283e-05, "loss": 0.0108, "step": 131360 }, { "epoch": 1.42, "learning_rate": 8.697217357462541e-05, "loss": 0.0073, "step": 131370 }, { "epoch": 1.42, "learning_rate": 8.695595770902249e-05, "loss": 0.0071, "step": 131380 }, { "epoch": 1.42, "learning_rate": 8.69397418434196e-05, "loss": 0.0077, "step": 131390 }, { "epoch": 1.42, "learning_rate": 8.692352597781669e-05, "loss": 0.0094, "step": 131400 }, { "epoch": 1.42, "learning_rate": 8.690731011221378e-05, "loss": 0.0116, "step": 131410 }, { "epoch": 1.42, "learning_rate": 8.689109424661087e-05, "loss": 0.0111, "step": 131420 }, { "epoch": 1.42, "learning_rate": 8.687487838100797e-05, "loss": 0.0128, "step": 131430 }, { "epoch": 1.42, "learning_rate": 8.685866251540506e-05, "loss": 0.0087, "step": 131440 }, { "epoch": 1.42, "learning_rate": 8.684244664980217e-05, "loss": 0.0074, "step": 131450 }, { "epoch": 1.42, "learning_rate": 8.682623078419924e-05, "loss": 0.0088, "step": 131460 }, { "epoch": 1.42, "learning_rate": 8.681001491859635e-05, "loss": 0.0085, "step": 131470 }, { "epoch": 1.42, "learning_rate": 8.679379905299343e-05, "loss": 0.0074, "step": 131480 }, { "epoch": 1.42, "learning_rate": 8.677758318739054e-05, "loss": 0.0079, "step": 131490 }, { "epoch": 1.42, "learning_rate": 8.676136732178763e-05, "loss": 0.0096, "step": 131500 }, { "epoch": 1.42, "learning_rate": 8.674515145618472e-05, "loss": 0.0075, "step": 131510 }, { "epoch": 1.42, "learning_rate": 8.672893559058181e-05, "loss": 0.0094, "step": 131520 }, { "epoch": 1.42, "learning_rate": 8.671271972497891e-05, "loss": 0.0073, "step": 131530 }, { "epoch": 1.42, "learning_rate": 8.6696503859376e-05, "loss": 0.0083, "step": 131540 }, { "epoch": 1.42, "learning_rate": 8.66802879937731e-05, "loss": 0.0091, "step": 131550 }, { "epoch": 1.42, "learning_rate": 8.666407212817019e-05, "loss": 0.0101, "step": 131560 }, { "epoch": 1.42, "learning_rate": 8.664785626256729e-05, "loss": 0.0073, "step": 131570 }, { "epoch": 1.42, "learning_rate": 8.663164039696437e-05, "loss": 0.0062, "step": 131580 }, { "epoch": 1.42, "learning_rate": 8.661542453136148e-05, "loss": 0.0088, "step": 131590 }, { "epoch": 1.42, "learning_rate": 8.659920866575856e-05, "loss": 0.0095, "step": 131600 }, { "epoch": 1.42, "learning_rate": 8.658299280015566e-05, "loss": 0.0067, "step": 131610 }, { "epoch": 1.42, "learning_rate": 8.656677693455276e-05, "loss": 0.0086, "step": 131620 }, { "epoch": 1.42, "learning_rate": 8.655056106894985e-05, "loss": 0.0075, "step": 131630 }, { "epoch": 1.42, "learning_rate": 8.653434520334695e-05, "loss": 0.0085, "step": 131640 }, { "epoch": 1.42, "learning_rate": 8.651812933774405e-05, "loss": 0.0076, "step": 131650 }, { "epoch": 1.42, "learning_rate": 8.650191347214114e-05, "loss": 0.0091, "step": 131660 }, { "epoch": 1.42, "learning_rate": 8.648569760653823e-05, "loss": 0.0067, "step": 131670 }, { "epoch": 1.42, "learning_rate": 8.646948174093533e-05, "loss": 0.0082, "step": 131680 }, { "epoch": 1.42, "learning_rate": 8.645326587533242e-05, "loss": 0.0094, "step": 131690 }, { "epoch": 1.42, "learning_rate": 8.643705000972952e-05, "loss": 0.0096, "step": 131700 }, { "epoch": 1.42, "learning_rate": 8.64208341441266e-05, "loss": 0.01, "step": 131710 }, { "epoch": 1.42, "learning_rate": 8.640461827852371e-05, "loss": 0.0068, "step": 131720 }, { "epoch": 1.42, "learning_rate": 8.638840241292079e-05, "loss": 0.0114, "step": 131730 }, { "epoch": 1.42, "learning_rate": 8.63721865473179e-05, "loss": 0.0067, "step": 131740 }, { "epoch": 1.42, "learning_rate": 8.635597068171497e-05, "loss": 0.0087, "step": 131750 }, { "epoch": 1.42, "learning_rate": 8.633975481611208e-05, "loss": 0.0087, "step": 131760 }, { "epoch": 1.42, "learning_rate": 8.632353895050917e-05, "loss": 0.0085, "step": 131770 }, { "epoch": 1.42, "learning_rate": 8.630732308490627e-05, "loss": 0.0076, "step": 131780 }, { "epoch": 1.42, "learning_rate": 8.629110721930336e-05, "loss": 0.0095, "step": 131790 }, { "epoch": 1.42, "learning_rate": 8.627489135370047e-05, "loss": 0.0104, "step": 131800 }, { "epoch": 1.42, "learning_rate": 8.625867548809754e-05, "loss": 0.0076, "step": 131810 }, { "epoch": 1.43, "learning_rate": 8.624245962249465e-05, "loss": 0.0084, "step": 131820 }, { "epoch": 1.43, "learning_rate": 8.622624375689173e-05, "loss": 0.0107, "step": 131830 }, { "epoch": 1.43, "learning_rate": 8.621002789128884e-05, "loss": 0.0081, "step": 131840 }, { "epoch": 1.43, "learning_rate": 8.619381202568592e-05, "loss": 0.007, "step": 131850 }, { "epoch": 1.43, "learning_rate": 8.617759616008302e-05, "loss": 0.0098, "step": 131860 }, { "epoch": 1.43, "learning_rate": 8.616138029448011e-05, "loss": 0.0059, "step": 131870 }, { "epoch": 1.43, "learning_rate": 8.614516442887721e-05, "loss": 0.008, "step": 131880 }, { "epoch": 1.43, "learning_rate": 8.61289485632743e-05, "loss": 0.0096, "step": 131890 }, { "epoch": 1.43, "learning_rate": 8.611273269767139e-05, "loss": 0.0068, "step": 131900 }, { "epoch": 1.43, "learning_rate": 8.609651683206849e-05, "loss": 0.01, "step": 131910 }, { "epoch": 1.43, "learning_rate": 8.608030096646559e-05, "loss": 0.0077, "step": 131920 }, { "epoch": 1.43, "learning_rate": 8.606408510086267e-05, "loss": 0.0074, "step": 131930 }, { "epoch": 1.43, "learning_rate": 8.604786923525978e-05, "loss": 0.0095, "step": 131940 }, { "epoch": 1.43, "learning_rate": 8.603165336965686e-05, "loss": 0.0076, "step": 131950 }, { "epoch": 1.43, "learning_rate": 8.601543750405396e-05, "loss": 0.0075, "step": 131960 }, { "epoch": 1.43, "learning_rate": 8.599922163845106e-05, "loss": 0.0088, "step": 131970 }, { "epoch": 1.43, "learning_rate": 8.598300577284815e-05, "loss": 0.0077, "step": 131980 }, { "epoch": 1.43, "learning_rate": 8.596678990724524e-05, "loss": 0.007, "step": 131990 }, { "epoch": 1.43, "learning_rate": 8.595057404164233e-05, "loss": 0.0064, "step": 132000 }, { "epoch": 1.43, "eval_cer": 0.9215443065682019, "eval_loss": 0.0068144891411066055, "eval_runtime": 121.5561, "eval_samples_per_second": 16.453, "eval_steps_per_second": 4.113, "step": 132000 }, { "epoch": 1.43, "learning_rate": 8.593435817603943e-05, "loss": 0.0065, "step": 132010 }, { "epoch": 1.43, "learning_rate": 8.591814231043653e-05, "loss": 0.0077, "step": 132020 }, { "epoch": 1.43, "learning_rate": 8.590192644483361e-05, "loss": 0.0081, "step": 132030 }, { "epoch": 1.43, "learning_rate": 8.588571057923072e-05, "loss": 0.0081, "step": 132040 }, { "epoch": 1.43, "learning_rate": 8.58694947136278e-05, "loss": 0.0067, "step": 132050 }, { "epoch": 1.43, "learning_rate": 8.58532788480249e-05, "loss": 0.0097, "step": 132060 }, { "epoch": 1.43, "learning_rate": 8.583706298242198e-05, "loss": 0.0108, "step": 132070 }, { "epoch": 1.43, "learning_rate": 8.582084711681909e-05, "loss": 0.0097, "step": 132080 }, { "epoch": 1.43, "learning_rate": 8.580463125121618e-05, "loss": 0.0083, "step": 132090 }, { "epoch": 1.43, "learning_rate": 8.578841538561328e-05, "loss": 0.0084, "step": 132100 }, { "epoch": 1.43, "learning_rate": 8.577219952001037e-05, "loss": 0.0083, "step": 132110 }, { "epoch": 1.43, "learning_rate": 8.575598365440747e-05, "loss": 0.0069, "step": 132120 }, { "epoch": 1.43, "learning_rate": 8.573976778880455e-05, "loss": 0.0072, "step": 132130 }, { "epoch": 1.43, "learning_rate": 8.572355192320166e-05, "loss": 0.0064, "step": 132140 }, { "epoch": 1.43, "learning_rate": 8.570733605759874e-05, "loss": 0.01, "step": 132150 }, { "epoch": 1.43, "learning_rate": 8.569112019199585e-05, "loss": 0.0085, "step": 132160 }, { "epoch": 1.43, "learning_rate": 8.567490432639292e-05, "loss": 0.0072, "step": 132170 }, { "epoch": 1.43, "learning_rate": 8.565868846079003e-05, "loss": 0.0096, "step": 132180 }, { "epoch": 1.43, "learning_rate": 8.564247259518712e-05, "loss": 0.01, "step": 132190 }, { "epoch": 1.43, "learning_rate": 8.562625672958422e-05, "loss": 0.0088, "step": 132200 }, { "epoch": 1.43, "learning_rate": 8.561004086398131e-05, "loss": 0.0109, "step": 132210 }, { "epoch": 1.43, "learning_rate": 8.55938249983784e-05, "loss": 0.0095, "step": 132220 }, { "epoch": 1.43, "learning_rate": 8.55776091327755e-05, "loss": 0.008, "step": 132230 }, { "epoch": 1.43, "learning_rate": 8.55613932671726e-05, "loss": 0.0081, "step": 132240 }, { "epoch": 1.43, "learning_rate": 8.554517740156968e-05, "loss": 0.0075, "step": 132250 }, { "epoch": 1.43, "learning_rate": 8.552896153596679e-05, "loss": 0.008, "step": 132260 }, { "epoch": 1.43, "learning_rate": 8.551274567036387e-05, "loss": 0.0111, "step": 132270 }, { "epoch": 1.43, "learning_rate": 8.549652980476097e-05, "loss": 0.0092, "step": 132280 }, { "epoch": 1.43, "learning_rate": 8.548031393915805e-05, "loss": 0.0083, "step": 132290 }, { "epoch": 1.43, "learning_rate": 8.546409807355516e-05, "loss": 0.0084, "step": 132300 }, { "epoch": 1.43, "learning_rate": 8.544788220795225e-05, "loss": 0.0067, "step": 132310 }, { "epoch": 1.43, "learning_rate": 8.543166634234934e-05, "loss": 0.0084, "step": 132320 }, { "epoch": 1.43, "learning_rate": 8.541545047674644e-05, "loss": 0.0112, "step": 132330 }, { "epoch": 1.43, "learning_rate": 8.539923461114354e-05, "loss": 0.0096, "step": 132340 }, { "epoch": 1.43, "learning_rate": 8.538301874554062e-05, "loss": 0.0066, "step": 132350 }, { "epoch": 1.43, "learning_rate": 8.536680287993773e-05, "loss": 0.0086, "step": 132360 }, { "epoch": 1.43, "learning_rate": 8.535058701433482e-05, "loss": 0.0083, "step": 132370 }, { "epoch": 1.43, "learning_rate": 8.533437114873191e-05, "loss": 0.0091, "step": 132380 }, { "epoch": 1.43, "learning_rate": 8.531815528312902e-05, "loss": 0.0097, "step": 132390 }, { "epoch": 1.43, "learning_rate": 8.53019394175261e-05, "loss": 0.0081, "step": 132400 }, { "epoch": 1.43, "learning_rate": 8.52857235519232e-05, "loss": 0.0089, "step": 132410 }, { "epoch": 1.43, "learning_rate": 8.526950768632028e-05, "loss": 0.0066, "step": 132420 }, { "epoch": 1.43, "learning_rate": 8.525329182071739e-05, "loss": 0.0074, "step": 132430 }, { "epoch": 1.43, "learning_rate": 8.523707595511447e-05, "loss": 0.008, "step": 132440 }, { "epoch": 1.43, "learning_rate": 8.522086008951158e-05, "loss": 0.0067, "step": 132450 }, { "epoch": 1.43, "learning_rate": 8.520464422390867e-05, "loss": 0.0094, "step": 132460 }, { "epoch": 1.43, "learning_rate": 8.518842835830576e-05, "loss": 0.0085, "step": 132470 }, { "epoch": 1.43, "learning_rate": 8.517221249270285e-05, "loss": 0.0078, "step": 132480 }, { "epoch": 1.43, "learning_rate": 8.515599662709996e-05, "loss": 0.0078, "step": 132490 }, { "epoch": 1.43, "learning_rate": 8.513978076149704e-05, "loss": 0.0088, "step": 132500 }, { "epoch": 1.43, "learning_rate": 8.512356489589415e-05, "loss": 0.0093, "step": 132510 }, { "epoch": 1.43, "learning_rate": 8.510734903029122e-05, "loss": 0.0087, "step": 132520 }, { "epoch": 1.43, "learning_rate": 8.509113316468833e-05, "loss": 0.0082, "step": 132530 }, { "epoch": 1.43, "learning_rate": 8.507491729908541e-05, "loss": 0.0111, "step": 132540 }, { "epoch": 1.43, "learning_rate": 8.505870143348252e-05, "loss": 0.0072, "step": 132550 }, { "epoch": 1.43, "learning_rate": 8.504248556787961e-05, "loss": 0.0067, "step": 132560 }, { "epoch": 1.43, "learning_rate": 8.50262697022767e-05, "loss": 0.0093, "step": 132570 }, { "epoch": 1.43, "learning_rate": 8.50100538366738e-05, "loss": 0.0088, "step": 132580 }, { "epoch": 1.43, "learning_rate": 8.499383797107089e-05, "loss": 0.0082, "step": 132590 }, { "epoch": 1.43, "learning_rate": 8.497762210546798e-05, "loss": 0.0105, "step": 132600 }, { "epoch": 1.43, "learning_rate": 8.496140623986509e-05, "loss": 0.0084, "step": 132610 }, { "epoch": 1.43, "learning_rate": 8.494519037426217e-05, "loss": 0.008, "step": 132620 }, { "epoch": 1.43, "learning_rate": 8.492897450865927e-05, "loss": 0.0074, "step": 132630 }, { "epoch": 1.43, "learning_rate": 8.491275864305635e-05, "loss": 0.0076, "step": 132640 }, { "epoch": 1.43, "learning_rate": 8.489654277745346e-05, "loss": 0.0085, "step": 132650 }, { "epoch": 1.43, "learning_rate": 8.488032691185055e-05, "loss": 0.0074, "step": 132660 }, { "epoch": 1.43, "learning_rate": 8.486411104624764e-05, "loss": 0.0099, "step": 132670 }, { "epoch": 1.43, "learning_rate": 8.484789518064474e-05, "loss": 0.0087, "step": 132680 }, { "epoch": 1.43, "learning_rate": 8.483167931504183e-05, "loss": 0.0076, "step": 132690 }, { "epoch": 1.43, "learning_rate": 8.481546344943892e-05, "loss": 0.0087, "step": 132700 }, { "epoch": 1.43, "learning_rate": 8.479924758383603e-05, "loss": 0.0093, "step": 132710 }, { "epoch": 1.43, "learning_rate": 8.47830317182331e-05, "loss": 0.0082, "step": 132720 }, { "epoch": 1.43, "learning_rate": 8.476681585263021e-05, "loss": 0.0087, "step": 132730 }, { "epoch": 1.43, "learning_rate": 8.475059998702729e-05, "loss": 0.008, "step": 132740 }, { "epoch": 1.44, "learning_rate": 8.47343841214244e-05, "loss": 0.0104, "step": 132750 }, { "epoch": 1.44, "learning_rate": 8.471816825582148e-05, "loss": 0.0083, "step": 132760 }, { "epoch": 1.44, "learning_rate": 8.470195239021858e-05, "loss": 0.007, "step": 132770 }, { "epoch": 1.44, "learning_rate": 8.468573652461568e-05, "loss": 0.0094, "step": 132780 }, { "epoch": 1.44, "learning_rate": 8.466952065901277e-05, "loss": 0.0067, "step": 132790 }, { "epoch": 1.44, "learning_rate": 8.465330479340986e-05, "loss": 0.0108, "step": 132800 }, { "epoch": 1.44, "learning_rate": 8.463708892780697e-05, "loss": 0.0093, "step": 132810 }, { "epoch": 1.44, "learning_rate": 8.462087306220405e-05, "loss": 0.0093, "step": 132820 }, { "epoch": 1.44, "learning_rate": 8.460465719660115e-05, "loss": 0.0084, "step": 132830 }, { "epoch": 1.44, "learning_rate": 8.458844133099823e-05, "loss": 0.0071, "step": 132840 }, { "epoch": 1.44, "learning_rate": 8.457222546539534e-05, "loss": 0.0105, "step": 132850 }, { "epoch": 1.44, "learning_rate": 8.455600959979242e-05, "loss": 0.0089, "step": 132860 }, { "epoch": 1.44, "learning_rate": 8.453979373418952e-05, "loss": 0.0088, "step": 132870 }, { "epoch": 1.44, "learning_rate": 8.452357786858662e-05, "loss": 0.0071, "step": 132880 }, { "epoch": 1.44, "learning_rate": 8.450736200298371e-05, "loss": 0.0086, "step": 132890 }, { "epoch": 1.44, "learning_rate": 8.44911461373808e-05, "loss": 0.0096, "step": 132900 }, { "epoch": 1.44, "learning_rate": 8.44749302717779e-05, "loss": 0.0102, "step": 132910 }, { "epoch": 1.44, "learning_rate": 8.445871440617499e-05, "loss": 0.0094, "step": 132920 }, { "epoch": 1.44, "learning_rate": 8.44424985405721e-05, "loss": 0.0092, "step": 132930 }, { "epoch": 1.44, "learning_rate": 8.442628267496917e-05, "loss": 0.0088, "step": 132940 }, { "epoch": 1.44, "learning_rate": 8.441006680936628e-05, "loss": 0.0088, "step": 132950 }, { "epoch": 1.44, "learning_rate": 8.439385094376336e-05, "loss": 0.01, "step": 132960 }, { "epoch": 1.44, "learning_rate": 8.437763507816047e-05, "loss": 0.008, "step": 132970 }, { "epoch": 1.44, "learning_rate": 8.436141921255754e-05, "loss": 0.007, "step": 132980 }, { "epoch": 1.44, "learning_rate": 8.434520334695465e-05, "loss": 0.0097, "step": 132990 }, { "epoch": 1.44, "learning_rate": 8.432898748135174e-05, "loss": 0.0064, "step": 133000 }, { "epoch": 1.44, "eval_cer": 0.9215364891415945, "eval_loss": 0.006863737478852272, "eval_runtime": 121.164, "eval_samples_per_second": 16.507, "eval_steps_per_second": 4.127, "step": 133000 }, { "epoch": 1.44, "learning_rate": 8.431277161574884e-05, "loss": 0.009, "step": 133010 }, { "epoch": 1.44, "learning_rate": 8.429655575014593e-05, "loss": 0.0063, "step": 133020 }, { "epoch": 1.44, "learning_rate": 8.428033988454304e-05, "loss": 0.008, "step": 133030 }, { "epoch": 1.44, "learning_rate": 8.426412401894011e-05, "loss": 0.0064, "step": 133040 }, { "epoch": 1.44, "learning_rate": 8.424790815333722e-05, "loss": 0.0092, "step": 133050 }, { "epoch": 1.44, "learning_rate": 8.42316922877343e-05, "loss": 0.008, "step": 133060 }, { "epoch": 1.44, "learning_rate": 8.42154764221314e-05, "loss": 0.0074, "step": 133070 }, { "epoch": 1.44, "learning_rate": 8.419926055652851e-05, "loss": 0.01, "step": 133080 }, { "epoch": 1.44, "learning_rate": 8.418304469092559e-05, "loss": 0.0095, "step": 133090 }, { "epoch": 1.44, "learning_rate": 8.41668288253227e-05, "loss": 0.0076, "step": 133100 }, { "epoch": 1.44, "learning_rate": 8.415061295971978e-05, "loss": 0.0086, "step": 133110 }, { "epoch": 1.44, "learning_rate": 8.413439709411688e-05, "loss": 0.0091, "step": 133120 }, { "epoch": 1.44, "learning_rate": 8.411818122851398e-05, "loss": 0.0102, "step": 133130 }, { "epoch": 1.44, "learning_rate": 8.410196536291107e-05, "loss": 0.0089, "step": 133140 }, { "epoch": 1.44, "learning_rate": 8.408574949730816e-05, "loss": 0.0067, "step": 133150 }, { "epoch": 1.44, "learning_rate": 8.406953363170525e-05, "loss": 0.0063, "step": 133160 }, { "epoch": 1.44, "learning_rate": 8.405331776610235e-05, "loss": 0.0085, "step": 133170 }, { "epoch": 1.44, "learning_rate": 8.403710190049945e-05, "loss": 0.0107, "step": 133180 }, { "epoch": 1.44, "learning_rate": 8.402088603489653e-05, "loss": 0.0109, "step": 133190 }, { "epoch": 1.44, "learning_rate": 8.400467016929364e-05, "loss": 0.0083, "step": 133200 }, { "epoch": 1.44, "learning_rate": 8.398845430369072e-05, "loss": 0.0078, "step": 133210 }, { "epoch": 1.44, "learning_rate": 8.397223843808782e-05, "loss": 0.0082, "step": 133220 }, { "epoch": 1.44, "learning_rate": 8.39560225724849e-05, "loss": 0.0098, "step": 133230 }, { "epoch": 1.44, "learning_rate": 8.393980670688201e-05, "loss": 0.0066, "step": 133240 }, { "epoch": 1.44, "learning_rate": 8.39235908412791e-05, "loss": 0.0063, "step": 133250 }, { "epoch": 1.44, "learning_rate": 8.39073749756762e-05, "loss": 0.0076, "step": 133260 }, { "epoch": 1.44, "learning_rate": 8.389115911007329e-05, "loss": 0.0085, "step": 133270 }, { "epoch": 1.44, "learning_rate": 8.38749432444704e-05, "loss": 0.0077, "step": 133280 }, { "epoch": 1.44, "learning_rate": 8.385872737886747e-05, "loss": 0.0072, "step": 133290 }, { "epoch": 1.44, "learning_rate": 8.384251151326458e-05, "loss": 0.0073, "step": 133300 }, { "epoch": 1.44, "learning_rate": 8.382629564766166e-05, "loss": 0.0072, "step": 133310 }, { "epoch": 1.44, "learning_rate": 8.381007978205877e-05, "loss": 0.0086, "step": 133320 }, { "epoch": 1.44, "learning_rate": 8.379386391645585e-05, "loss": 0.009, "step": 133330 }, { "epoch": 1.44, "learning_rate": 8.377764805085295e-05, "loss": 0.0079, "step": 133340 }, { "epoch": 1.44, "learning_rate": 8.376143218525004e-05, "loss": 0.0097, "step": 133350 }, { "epoch": 1.44, "learning_rate": 8.374521631964714e-05, "loss": 0.0083, "step": 133360 }, { "epoch": 1.44, "learning_rate": 8.372900045404423e-05, "loss": 0.0065, "step": 133370 }, { "epoch": 1.44, "learning_rate": 8.371278458844132e-05, "loss": 0.0094, "step": 133380 }, { "epoch": 1.44, "learning_rate": 8.369656872283842e-05, "loss": 0.0103, "step": 133390 }, { "epoch": 1.44, "learning_rate": 8.368035285723552e-05, "loss": 0.0083, "step": 133400 }, { "epoch": 1.44, "learning_rate": 8.36641369916326e-05, "loss": 0.0082, "step": 133410 }, { "epoch": 1.44, "learning_rate": 8.364792112602971e-05, "loss": 0.0077, "step": 133420 }, { "epoch": 1.44, "learning_rate": 8.363170526042679e-05, "loss": 0.0095, "step": 133430 }, { "epoch": 1.44, "learning_rate": 8.361548939482389e-05, "loss": 0.0088, "step": 133440 }, { "epoch": 1.44, "learning_rate": 8.359927352922097e-05, "loss": 0.0091, "step": 133450 }, { "epoch": 1.44, "learning_rate": 8.358305766361808e-05, "loss": 0.0107, "step": 133460 }, { "epoch": 1.44, "learning_rate": 8.356684179801517e-05, "loss": 0.0108, "step": 133470 }, { "epoch": 1.44, "learning_rate": 8.355062593241226e-05, "loss": 0.008, "step": 133480 }, { "epoch": 1.44, "learning_rate": 8.353441006680936e-05, "loss": 0.009, "step": 133490 }, { "epoch": 1.44, "learning_rate": 8.351819420120646e-05, "loss": 0.0068, "step": 133500 }, { "epoch": 1.44, "learning_rate": 8.350197833560354e-05, "loss": 0.0088, "step": 133510 }, { "epoch": 1.44, "learning_rate": 8.348576247000065e-05, "loss": 0.0076, "step": 133520 }, { "epoch": 1.44, "learning_rate": 8.346954660439773e-05, "loss": 0.0099, "step": 133530 }, { "epoch": 1.44, "learning_rate": 8.345333073879483e-05, "loss": 0.0102, "step": 133540 }, { "epoch": 1.44, "learning_rate": 8.343711487319191e-05, "loss": 0.0087, "step": 133550 }, { "epoch": 1.44, "learning_rate": 8.342089900758902e-05, "loss": 0.0097, "step": 133560 }, { "epoch": 1.44, "learning_rate": 8.340468314198611e-05, "loss": 0.0089, "step": 133570 }, { "epoch": 1.44, "learning_rate": 8.33884672763832e-05, "loss": 0.0097, "step": 133580 }, { "epoch": 1.44, "learning_rate": 8.33722514107803e-05, "loss": 0.0074, "step": 133590 }, { "epoch": 1.44, "learning_rate": 8.335603554517739e-05, "loss": 0.0078, "step": 133600 }, { "epoch": 1.44, "learning_rate": 8.333981967957448e-05, "loss": 0.0076, "step": 133610 }, { "epoch": 1.44, "learning_rate": 8.332360381397159e-05, "loss": 0.0081, "step": 133620 }, { "epoch": 1.44, "learning_rate": 8.330738794836867e-05, "loss": 0.0067, "step": 133630 }, { "epoch": 1.44, "learning_rate": 8.329117208276577e-05, "loss": 0.0105, "step": 133640 }, { "epoch": 1.44, "learning_rate": 8.327495621716285e-05, "loss": 0.0067, "step": 133650 }, { "epoch": 1.44, "learning_rate": 8.325874035155996e-05, "loss": 0.009, "step": 133660 }, { "epoch": 1.45, "learning_rate": 8.324252448595705e-05, "loss": 0.0078, "step": 133670 }, { "epoch": 1.45, "learning_rate": 8.322630862035415e-05, "loss": 0.0082, "step": 133680 }, { "epoch": 1.45, "learning_rate": 8.321009275475124e-05, "loss": 0.0091, "step": 133690 }, { "epoch": 1.45, "learning_rate": 8.319387688914833e-05, "loss": 0.0084, "step": 133700 }, { "epoch": 1.45, "learning_rate": 8.317766102354542e-05, "loss": 0.0091, "step": 133710 }, { "epoch": 1.45, "learning_rate": 8.316144515794253e-05, "loss": 0.0094, "step": 133720 }, { "epoch": 1.45, "learning_rate": 8.314522929233961e-05, "loss": 0.0064, "step": 133730 }, { "epoch": 1.45, "learning_rate": 8.312901342673672e-05, "loss": 0.0087, "step": 133740 }, { "epoch": 1.45, "learning_rate": 8.31127975611338e-05, "loss": 0.0082, "step": 133750 }, { "epoch": 1.45, "learning_rate": 8.30965816955309e-05, "loss": 0.007, "step": 133760 }, { "epoch": 1.45, "learning_rate": 8.308036582992798e-05, "loss": 0.0073, "step": 133770 }, { "epoch": 1.45, "learning_rate": 8.306414996432509e-05, "loss": 0.0088, "step": 133780 }, { "epoch": 1.45, "learning_rate": 8.304793409872219e-05, "loss": 0.0078, "step": 133790 }, { "epoch": 1.45, "learning_rate": 8.303171823311927e-05, "loss": 0.0071, "step": 133800 }, { "epoch": 1.45, "learning_rate": 8.301550236751638e-05, "loss": 0.007, "step": 133810 }, { "epoch": 1.45, "learning_rate": 8.299928650191347e-05, "loss": 0.0089, "step": 133820 }, { "epoch": 1.45, "learning_rate": 8.298307063631056e-05, "loss": 0.0083, "step": 133830 }, { "epoch": 1.45, "learning_rate": 8.296685477070766e-05, "loss": 0.0111, "step": 133840 }, { "epoch": 1.45, "learning_rate": 8.295063890510475e-05, "loss": 0.0072, "step": 133850 }, { "epoch": 1.45, "learning_rate": 8.293442303950184e-05, "loss": 0.0083, "step": 133860 }, { "epoch": 1.45, "learning_rate": 8.291820717389895e-05, "loss": 0.0083, "step": 133870 }, { "epoch": 1.45, "learning_rate": 8.290199130829603e-05, "loss": 0.0068, "step": 133880 }, { "epoch": 1.45, "learning_rate": 8.288577544269313e-05, "loss": 0.0069, "step": 133890 }, { "epoch": 1.45, "learning_rate": 8.286955957709021e-05, "loss": 0.0077, "step": 133900 }, { "epoch": 1.45, "learning_rate": 8.285334371148732e-05, "loss": 0.0072, "step": 133910 }, { "epoch": 1.45, "learning_rate": 8.28371278458844e-05, "loss": 0.0074, "step": 133920 }, { "epoch": 1.45, "learning_rate": 8.28209119802815e-05, "loss": 0.0077, "step": 133930 }, { "epoch": 1.45, "learning_rate": 8.28046961146786e-05, "loss": 0.0095, "step": 133940 }, { "epoch": 1.45, "learning_rate": 8.278848024907569e-05, "loss": 0.0084, "step": 133950 }, { "epoch": 1.45, "learning_rate": 8.277226438347278e-05, "loss": 0.0071, "step": 133960 }, { "epoch": 1.45, "learning_rate": 8.275604851786989e-05, "loss": 0.006, "step": 133970 }, { "epoch": 1.45, "learning_rate": 8.273983265226697e-05, "loss": 0.0092, "step": 133980 }, { "epoch": 1.45, "learning_rate": 8.272361678666407e-05, "loss": 0.0087, "step": 133990 }, { "epoch": 1.45, "learning_rate": 8.270740092106115e-05, "loss": 0.0139, "step": 134000 }, { "epoch": 1.45, "eval_cer": 0.9215547298036784, "eval_loss": 0.00670721335336566, "eval_runtime": 121.1717, "eval_samples_per_second": 16.506, "eval_steps_per_second": 4.126, "step": 134000 }, { "epoch": 1.45, "learning_rate": 8.269118505545826e-05, "loss": 0.0081, "step": 134010 }, { "epoch": 1.45, "learning_rate": 8.267496918985534e-05, "loss": 0.0101, "step": 134020 }, { "epoch": 1.45, "learning_rate": 8.265875332425245e-05, "loss": 0.0113, "step": 134030 }, { "epoch": 1.45, "learning_rate": 8.264253745864954e-05, "loss": 0.0072, "step": 134040 }, { "epoch": 1.45, "learning_rate": 8.262632159304663e-05, "loss": 0.0094, "step": 134050 }, { "epoch": 1.45, "learning_rate": 8.261010572744372e-05, "loss": 0.0072, "step": 134060 }, { "epoch": 1.45, "learning_rate": 8.259388986184082e-05, "loss": 0.0072, "step": 134070 }, { "epoch": 1.45, "learning_rate": 8.257767399623791e-05, "loss": 0.0075, "step": 134080 }, { "epoch": 1.45, "learning_rate": 8.256145813063502e-05, "loss": 0.0079, "step": 134090 }, { "epoch": 1.45, "learning_rate": 8.25452422650321e-05, "loss": 0.008, "step": 134100 }, { "epoch": 1.45, "learning_rate": 8.25290263994292e-05, "loss": 0.0077, "step": 134110 }, { "epoch": 1.45, "learning_rate": 8.251281053382628e-05, "loss": 0.008, "step": 134120 }, { "epoch": 1.45, "learning_rate": 8.249659466822339e-05, "loss": 0.0092, "step": 134130 }, { "epoch": 1.45, "learning_rate": 8.248037880262048e-05, "loss": 0.0065, "step": 134140 }, { "epoch": 1.45, "learning_rate": 8.246416293701757e-05, "loss": 0.0087, "step": 134150 }, { "epoch": 1.45, "learning_rate": 8.244794707141466e-05, "loss": 0.0077, "step": 134160 }, { "epoch": 1.45, "learning_rate": 8.243173120581176e-05, "loss": 0.009, "step": 134170 }, { "epoch": 1.45, "learning_rate": 8.241551534020885e-05, "loss": 0.0101, "step": 134180 }, { "epoch": 1.45, "learning_rate": 8.239929947460596e-05, "loss": 0.0085, "step": 134190 }, { "epoch": 1.45, "learning_rate": 8.238308360900304e-05, "loss": 0.0068, "step": 134200 }, { "epoch": 1.45, "learning_rate": 8.236686774340014e-05, "loss": 0.0096, "step": 134210 }, { "epoch": 1.45, "learning_rate": 8.235065187779722e-05, "loss": 0.0068, "step": 134220 }, { "epoch": 1.45, "learning_rate": 8.233443601219433e-05, "loss": 0.0083, "step": 134230 }, { "epoch": 1.45, "learning_rate": 8.23182201465914e-05, "loss": 0.0069, "step": 134240 }, { "epoch": 1.45, "learning_rate": 8.230200428098851e-05, "loss": 0.0077, "step": 134250 }, { "epoch": 1.45, "learning_rate": 8.22857884153856e-05, "loss": 0.0068, "step": 134260 }, { "epoch": 1.45, "learning_rate": 8.22695725497827e-05, "loss": 0.0086, "step": 134270 }, { "epoch": 1.45, "learning_rate": 8.225335668417979e-05, "loss": 0.0075, "step": 134280 }, { "epoch": 1.45, "learning_rate": 8.22371408185769e-05, "loss": 0.0074, "step": 134290 }, { "epoch": 1.45, "learning_rate": 8.222092495297398e-05, "loss": 0.0106, "step": 134300 }, { "epoch": 1.45, "learning_rate": 8.220470908737108e-05, "loss": 0.0084, "step": 134310 }, { "epoch": 1.45, "learning_rate": 8.218849322176816e-05, "loss": 0.0106, "step": 134320 }, { "epoch": 1.45, "learning_rate": 8.217227735616527e-05, "loss": 0.0084, "step": 134330 }, { "epoch": 1.45, "learning_rate": 8.215606149056235e-05, "loss": 0.009, "step": 134340 }, { "epoch": 1.45, "learning_rate": 8.213984562495945e-05, "loss": 0.0086, "step": 134350 }, { "epoch": 1.45, "learning_rate": 8.212362975935655e-05, "loss": 0.0076, "step": 134360 }, { "epoch": 1.45, "learning_rate": 8.210741389375364e-05, "loss": 0.0077, "step": 134370 }, { "epoch": 1.45, "learning_rate": 8.209119802815073e-05, "loss": 0.0078, "step": 134380 }, { "epoch": 1.45, "learning_rate": 8.207498216254783e-05, "loss": 0.0106, "step": 134390 }, { "epoch": 1.45, "learning_rate": 8.205876629694492e-05, "loss": 0.0086, "step": 134400 }, { "epoch": 1.45, "learning_rate": 8.204255043134202e-05, "loss": 0.0095, "step": 134410 }, { "epoch": 1.45, "learning_rate": 8.20263345657391e-05, "loss": 0.0082, "step": 134420 }, { "epoch": 1.45, "learning_rate": 8.201011870013621e-05, "loss": 0.0076, "step": 134430 }, { "epoch": 1.45, "learning_rate": 8.199390283453329e-05, "loss": 0.009, "step": 134440 }, { "epoch": 1.45, "learning_rate": 8.19776869689304e-05, "loss": 0.0077, "step": 134450 }, { "epoch": 1.45, "learning_rate": 8.196147110332747e-05, "loss": 0.0077, "step": 134460 }, { "epoch": 1.45, "learning_rate": 8.194525523772458e-05, "loss": 0.0076, "step": 134470 }, { "epoch": 1.45, "learning_rate": 8.192903937212167e-05, "loss": 0.0089, "step": 134480 }, { "epoch": 1.45, "learning_rate": 8.191282350651877e-05, "loss": 0.0087, "step": 134490 }, { "epoch": 1.45, "learning_rate": 8.189660764091586e-05, "loss": 0.0083, "step": 134500 }, { "epoch": 1.45, "learning_rate": 8.188039177531297e-05, "loss": 0.0076, "step": 134510 }, { "epoch": 1.45, "learning_rate": 8.186417590971006e-05, "loss": 0.0075, "step": 134520 }, { "epoch": 1.45, "learning_rate": 8.184796004410715e-05, "loss": 0.0074, "step": 134530 }, { "epoch": 1.45, "learning_rate": 8.183174417850424e-05, "loss": 0.0068, "step": 134540 }, { "epoch": 1.45, "learning_rate": 8.181552831290134e-05, "loss": 0.0068, "step": 134550 }, { "epoch": 1.45, "learning_rate": 8.179931244729844e-05, "loss": 0.0072, "step": 134560 }, { "epoch": 1.45, "learning_rate": 8.178309658169552e-05, "loss": 0.0089, "step": 134570 }, { "epoch": 1.45, "learning_rate": 8.176688071609263e-05, "loss": 0.0079, "step": 134580 }, { "epoch": 1.45, "learning_rate": 8.175066485048971e-05, "loss": 0.0069, "step": 134590 }, { "epoch": 1.46, "learning_rate": 8.173444898488681e-05, "loss": 0.0104, "step": 134600 }, { "epoch": 1.46, "learning_rate": 8.171823311928389e-05, "loss": 0.0079, "step": 134610 }, { "epoch": 1.46, "learning_rate": 8.1702017253681e-05, "loss": 0.0096, "step": 134620 }, { "epoch": 1.46, "learning_rate": 8.168580138807809e-05, "loss": 0.0065, "step": 134630 }, { "epoch": 1.46, "learning_rate": 8.166958552247518e-05, "loss": 0.0104, "step": 134640 }, { "epoch": 1.46, "learning_rate": 8.165336965687228e-05, "loss": 0.0202, "step": 134650 }, { "epoch": 1.46, "learning_rate": 8.163715379126938e-05, "loss": 0.008, "step": 134660 }, { "epoch": 1.46, "learning_rate": 8.162093792566646e-05, "loss": 0.0077, "step": 134670 }, { "epoch": 1.46, "learning_rate": 8.160472206006357e-05, "loss": 0.0097, "step": 134680 }, { "epoch": 1.46, "learning_rate": 8.158850619446065e-05, "loss": 0.009, "step": 134690 }, { "epoch": 1.46, "learning_rate": 8.157229032885775e-05, "loss": 0.0099, "step": 134700 }, { "epoch": 1.46, "learning_rate": 8.155607446325483e-05, "loss": 0.0063, "step": 134710 }, { "epoch": 1.46, "learning_rate": 8.153985859765194e-05, "loss": 0.0085, "step": 134720 }, { "epoch": 1.46, "learning_rate": 8.152364273204903e-05, "loss": 0.0084, "step": 134730 }, { "epoch": 1.46, "learning_rate": 8.150742686644613e-05, "loss": 0.0074, "step": 134740 }, { "epoch": 1.46, "learning_rate": 8.149121100084322e-05, "loss": 0.0081, "step": 134750 }, { "epoch": 1.46, "learning_rate": 8.147499513524031e-05, "loss": 0.0072, "step": 134760 }, { "epoch": 1.46, "learning_rate": 8.14587792696374e-05, "loss": 0.0073, "step": 134770 }, { "epoch": 1.46, "learning_rate": 8.144256340403451e-05, "loss": 0.0088, "step": 134780 }, { "epoch": 1.46, "learning_rate": 8.142634753843159e-05, "loss": 0.0076, "step": 134790 }, { "epoch": 1.46, "learning_rate": 8.14101316728287e-05, "loss": 0.0089, "step": 134800 }, { "epoch": 1.46, "learning_rate": 8.139391580722577e-05, "loss": 0.0089, "step": 134810 }, { "epoch": 1.46, "learning_rate": 8.137769994162288e-05, "loss": 0.0095, "step": 134820 }, { "epoch": 1.46, "learning_rate": 8.136148407601997e-05, "loss": 0.0071, "step": 134830 }, { "epoch": 1.46, "learning_rate": 8.134526821041707e-05, "loss": 0.0058, "step": 134840 }, { "epoch": 1.46, "learning_rate": 8.132905234481416e-05, "loss": 0.0074, "step": 134850 }, { "epoch": 1.46, "learning_rate": 8.131283647921125e-05, "loss": 0.0072, "step": 134860 }, { "epoch": 1.46, "learning_rate": 8.129662061360834e-05, "loss": 0.0066, "step": 134870 }, { "epoch": 1.46, "learning_rate": 8.128040474800545e-05, "loss": 0.0091, "step": 134880 }, { "epoch": 1.46, "learning_rate": 8.126418888240253e-05, "loss": 0.008, "step": 134890 }, { "epoch": 1.46, "learning_rate": 8.124797301679964e-05, "loss": 0.011, "step": 134900 }, { "epoch": 1.46, "learning_rate": 8.123175715119672e-05, "loss": 0.0105, "step": 134910 }, { "epoch": 1.46, "learning_rate": 8.121554128559382e-05, "loss": 0.0058, "step": 134920 }, { "epoch": 1.46, "learning_rate": 8.11993254199909e-05, "loss": 0.0095, "step": 134930 }, { "epoch": 1.46, "learning_rate": 8.118310955438801e-05, "loss": 0.0079, "step": 134940 }, { "epoch": 1.46, "learning_rate": 8.11668936887851e-05, "loss": 0.0067, "step": 134950 }, { "epoch": 1.46, "learning_rate": 8.115067782318219e-05, "loss": 0.0128, "step": 134960 }, { "epoch": 1.46, "learning_rate": 8.113446195757929e-05, "loss": 0.0082, "step": 134970 }, { "epoch": 1.46, "learning_rate": 8.111824609197639e-05, "loss": 0.0085, "step": 134980 }, { "epoch": 1.46, "learning_rate": 8.110203022637347e-05, "loss": 0.009, "step": 134990 }, { "epoch": 1.46, "learning_rate": 8.108581436077058e-05, "loss": 0.0093, "step": 135000 }, { "epoch": 1.46, "eval_cer": 0.921567758848024, "eval_loss": 0.006778133567422628, "eval_runtime": 121.2762, "eval_samples_per_second": 16.491, "eval_steps_per_second": 4.123, "step": 135000 }, { "epoch": 1.46, "learning_rate": 8.106959849516766e-05, "loss": 0.0087, "step": 135010 }, { "epoch": 1.46, "learning_rate": 8.105338262956476e-05, "loss": 0.0065, "step": 135020 }, { "epoch": 1.46, "learning_rate": 8.103716676396184e-05, "loss": 0.0079, "step": 135030 }, { "epoch": 1.46, "learning_rate": 8.102095089835895e-05, "loss": 0.0098, "step": 135040 }, { "epoch": 1.46, "learning_rate": 8.100473503275604e-05, "loss": 0.0099, "step": 135050 }, { "epoch": 1.46, "learning_rate": 8.098851916715313e-05, "loss": 0.0084, "step": 135060 }, { "epoch": 1.46, "learning_rate": 8.097230330155023e-05, "loss": 0.0125, "step": 135070 }, { "epoch": 1.46, "learning_rate": 8.095608743594732e-05, "loss": 0.0085, "step": 135080 }, { "epoch": 1.46, "learning_rate": 8.093987157034441e-05, "loss": 0.008, "step": 135090 }, { "epoch": 1.46, "learning_rate": 8.092365570474152e-05, "loss": 0.0075, "step": 135100 }, { "epoch": 1.46, "learning_rate": 8.09074398391386e-05, "loss": 0.0067, "step": 135110 }, { "epoch": 1.46, "learning_rate": 8.08912239735357e-05, "loss": 0.0086, "step": 135120 }, { "epoch": 1.46, "learning_rate": 8.087500810793278e-05, "loss": 0.0074, "step": 135130 }, { "epoch": 1.46, "learning_rate": 8.085879224232989e-05, "loss": 0.0077, "step": 135140 }, { "epoch": 1.46, "learning_rate": 8.084257637672698e-05, "loss": 0.0075, "step": 135150 }, { "epoch": 1.46, "learning_rate": 8.082636051112407e-05, "loss": 0.0066, "step": 135160 }, { "epoch": 1.46, "learning_rate": 8.081014464552117e-05, "loss": 0.008, "step": 135170 }, { "epoch": 1.46, "learning_rate": 8.079392877991826e-05, "loss": 0.0071, "step": 135180 }, { "epoch": 1.46, "learning_rate": 8.077771291431535e-05, "loss": 0.0088, "step": 135190 }, { "epoch": 1.46, "learning_rate": 8.076149704871246e-05, "loss": 0.0076, "step": 135200 }, { "epoch": 1.46, "learning_rate": 8.074528118310954e-05, "loss": 0.0069, "step": 135210 }, { "epoch": 1.46, "learning_rate": 8.072906531750664e-05, "loss": 0.0073, "step": 135220 }, { "epoch": 1.46, "learning_rate": 8.071284945190374e-05, "loss": 0.0076, "step": 135230 }, { "epoch": 1.46, "learning_rate": 8.069663358630083e-05, "loss": 0.0091, "step": 135240 }, { "epoch": 1.46, "learning_rate": 8.068041772069794e-05, "loss": 0.0071, "step": 135250 }, { "epoch": 1.46, "learning_rate": 8.066420185509502e-05, "loss": 0.0066, "step": 135260 }, { "epoch": 1.46, "learning_rate": 8.064798598949212e-05, "loss": 0.0069, "step": 135270 }, { "epoch": 1.46, "learning_rate": 8.06317701238892e-05, "loss": 0.0082, "step": 135280 }, { "epoch": 1.46, "learning_rate": 8.061555425828631e-05, "loss": 0.0072, "step": 135290 }, { "epoch": 1.46, "learning_rate": 8.05993383926834e-05, "loss": 0.0075, "step": 135300 }, { "epoch": 1.46, "learning_rate": 8.058312252708049e-05, "loss": 0.0093, "step": 135310 }, { "epoch": 1.46, "learning_rate": 8.056690666147759e-05, "loss": 0.0085, "step": 135320 }, { "epoch": 1.46, "learning_rate": 8.055069079587468e-05, "loss": 0.0063, "step": 135330 }, { "epoch": 1.46, "learning_rate": 8.053447493027177e-05, "loss": 0.0058, "step": 135340 }, { "epoch": 1.46, "learning_rate": 8.051825906466888e-05, "loss": 0.0082, "step": 135350 }, { "epoch": 1.46, "learning_rate": 8.050204319906596e-05, "loss": 0.0085, "step": 135360 }, { "epoch": 1.46, "learning_rate": 8.048582733346306e-05, "loss": 0.0076, "step": 135370 }, { "epoch": 1.46, "learning_rate": 8.046961146786014e-05, "loss": 0.0074, "step": 135380 }, { "epoch": 1.46, "learning_rate": 8.045339560225725e-05, "loss": 0.0092, "step": 135390 }, { "epoch": 1.46, "learning_rate": 8.043717973665433e-05, "loss": 0.01, "step": 135400 }, { "epoch": 1.46, "learning_rate": 8.042096387105143e-05, "loss": 0.0066, "step": 135410 }, { "epoch": 1.46, "learning_rate": 8.040474800544853e-05, "loss": 0.0081, "step": 135420 }, { "epoch": 1.46, "learning_rate": 8.038853213984562e-05, "loss": 0.0074, "step": 135430 }, { "epoch": 1.46, "learning_rate": 8.037231627424271e-05, "loss": 0.0077, "step": 135440 }, { "epoch": 1.46, "learning_rate": 8.035610040863982e-05, "loss": 0.0085, "step": 135450 }, { "epoch": 1.46, "learning_rate": 8.03398845430369e-05, "loss": 0.0101, "step": 135460 }, { "epoch": 1.46, "learning_rate": 8.0323668677434e-05, "loss": 0.0058, "step": 135470 }, { "epoch": 1.46, "learning_rate": 8.030745281183108e-05, "loss": 0.0064, "step": 135480 }, { "epoch": 1.46, "learning_rate": 8.029123694622819e-05, "loss": 0.0083, "step": 135490 }, { "epoch": 1.46, "learning_rate": 8.027502108062527e-05, "loss": 0.0066, "step": 135500 }, { "epoch": 1.46, "learning_rate": 8.025880521502237e-05, "loss": 0.0094, "step": 135510 }, { "epoch": 1.47, "learning_rate": 8.024258934941947e-05, "loss": 0.0092, "step": 135520 }, { "epoch": 1.47, "learning_rate": 8.022637348381656e-05, "loss": 0.0059, "step": 135530 }, { "epoch": 1.47, "learning_rate": 8.021015761821365e-05, "loss": 0.008, "step": 135540 }, { "epoch": 1.47, "learning_rate": 8.019394175261075e-05, "loss": 0.0063, "step": 135550 }, { "epoch": 1.47, "learning_rate": 8.017772588700784e-05, "loss": 0.0078, "step": 135560 }, { "epoch": 1.47, "learning_rate": 8.016151002140494e-05, "loss": 0.0073, "step": 135570 }, { "epoch": 1.47, "learning_rate": 8.014529415580202e-05, "loss": 0.0074, "step": 135580 }, { "epoch": 1.47, "learning_rate": 8.012907829019913e-05, "loss": 0.0067, "step": 135590 }, { "epoch": 1.47, "learning_rate": 8.011286242459621e-05, "loss": 0.0093, "step": 135600 }, { "epoch": 1.47, "learning_rate": 8.009664655899332e-05, "loss": 0.0078, "step": 135610 }, { "epoch": 1.47, "learning_rate": 8.00804306933904e-05, "loss": 0.0083, "step": 135620 }, { "epoch": 1.47, "learning_rate": 8.00642148277875e-05, "loss": 0.0087, "step": 135630 }, { "epoch": 1.47, "learning_rate": 8.00479989621846e-05, "loss": 0.0091, "step": 135640 }, { "epoch": 1.47, "learning_rate": 8.003178309658169e-05, "loss": 0.0075, "step": 135650 }, { "epoch": 1.47, "learning_rate": 8.001556723097878e-05, "loss": 0.0076, "step": 135660 }, { "epoch": 1.47, "learning_rate": 7.999935136537589e-05, "loss": 0.0098, "step": 135670 }, { "epoch": 1.47, "learning_rate": 7.998313549977297e-05, "loss": 0.0082, "step": 135680 }, { "epoch": 1.47, "learning_rate": 7.996691963417007e-05, "loss": 0.0081, "step": 135690 }, { "epoch": 1.47, "learning_rate": 7.995070376856715e-05, "loss": 0.0069, "step": 135700 }, { "epoch": 1.47, "learning_rate": 7.993448790296426e-05, "loss": 0.0075, "step": 135710 }, { "epoch": 1.47, "learning_rate": 7.991827203736134e-05, "loss": 0.0097, "step": 135720 }, { "epoch": 1.47, "learning_rate": 7.990205617175844e-05, "loss": 0.009, "step": 135730 }, { "epoch": 1.47, "learning_rate": 7.988584030615554e-05, "loss": 0.0068, "step": 135740 }, { "epoch": 1.47, "learning_rate": 7.986962444055263e-05, "loss": 0.0109, "step": 135750 }, { "epoch": 1.47, "learning_rate": 7.985340857494972e-05, "loss": 0.0107, "step": 135760 }, { "epoch": 1.47, "learning_rate": 7.983719270934681e-05, "loss": 0.0086, "step": 135770 }, { "epoch": 1.47, "learning_rate": 7.98209768437439e-05, "loss": 0.0077, "step": 135780 }, { "epoch": 1.47, "learning_rate": 7.980476097814101e-05, "loss": 0.0089, "step": 135790 }, { "epoch": 1.47, "learning_rate": 7.978854511253809e-05, "loss": 0.0091, "step": 135800 }, { "epoch": 1.47, "learning_rate": 7.97723292469352e-05, "loss": 0.0083, "step": 135810 }, { "epoch": 1.47, "learning_rate": 7.975611338133228e-05, "loss": 0.0079, "step": 135820 }, { "epoch": 1.47, "learning_rate": 7.973989751572938e-05, "loss": 0.0076, "step": 135830 }, { "epoch": 1.47, "learning_rate": 7.972368165012648e-05, "loss": 0.0078, "step": 135840 }, { "epoch": 1.47, "learning_rate": 7.970746578452357e-05, "loss": 0.0097, "step": 135850 }, { "epoch": 1.47, "learning_rate": 7.969124991892066e-05, "loss": 0.0078, "step": 135860 }, { "epoch": 1.47, "learning_rate": 7.967503405331775e-05, "loss": 0.0078, "step": 135870 }, { "epoch": 1.47, "learning_rate": 7.965881818771485e-05, "loss": 0.0073, "step": 135880 }, { "epoch": 1.47, "learning_rate": 7.964260232211195e-05, "loss": 0.0109, "step": 135890 }, { "epoch": 1.47, "learning_rate": 7.962638645650903e-05, "loss": 0.0123, "step": 135900 }, { "epoch": 1.47, "learning_rate": 7.961017059090614e-05, "loss": 0.0086, "step": 135910 }, { "epoch": 1.47, "learning_rate": 7.959395472530322e-05, "loss": 0.0069, "step": 135920 }, { "epoch": 1.47, "learning_rate": 7.957773885970032e-05, "loss": 0.0078, "step": 135930 }, { "epoch": 1.47, "learning_rate": 7.95615229940974e-05, "loss": 0.0079, "step": 135940 }, { "epoch": 1.47, "learning_rate": 7.954530712849451e-05, "loss": 0.0094, "step": 135950 }, { "epoch": 1.47, "learning_rate": 7.952909126289162e-05, "loss": 0.0085, "step": 135960 }, { "epoch": 1.47, "learning_rate": 7.95128753972887e-05, "loss": 0.0079, "step": 135970 }, { "epoch": 1.47, "learning_rate": 7.94966595316858e-05, "loss": 0.01, "step": 135980 }, { "epoch": 1.47, "learning_rate": 7.94804436660829e-05, "loss": 0.0082, "step": 135990 }, { "epoch": 1.47, "learning_rate": 7.946422780047999e-05, "loss": 0.009, "step": 136000 }, { "epoch": 1.47, "eval_cer": 0.9215312775238562, "eval_loss": 0.006653364282101393, "eval_runtime": 121.3191, "eval_samples_per_second": 16.485, "eval_steps_per_second": 4.121, "step": 136000 }, { "epoch": 1.47, "learning_rate": 7.944801193487708e-05, "loss": 0.0085, "step": 136010 }, { "epoch": 1.47, "learning_rate": 7.943179606927417e-05, "loss": 0.0108, "step": 136020 }, { "epoch": 1.47, "learning_rate": 7.941558020367127e-05, "loss": 0.0083, "step": 136030 }, { "epoch": 1.47, "learning_rate": 7.939936433806837e-05, "loss": 0.007, "step": 136040 }, { "epoch": 1.47, "learning_rate": 7.938314847246545e-05, "loss": 0.0092, "step": 136050 }, { "epoch": 1.47, "learning_rate": 7.936693260686256e-05, "loss": 0.0054, "step": 136060 }, { "epoch": 1.47, "learning_rate": 7.935071674125964e-05, "loss": 0.0078, "step": 136070 }, { "epoch": 1.47, "learning_rate": 7.933450087565674e-05, "loss": 0.0087, "step": 136080 }, { "epoch": 1.47, "learning_rate": 7.931828501005382e-05, "loss": 0.0091, "step": 136090 }, { "epoch": 1.47, "learning_rate": 7.930206914445093e-05, "loss": 0.0077, "step": 136100 }, { "epoch": 1.47, "learning_rate": 7.928585327884802e-05, "loss": 0.0092, "step": 136110 }, { "epoch": 1.47, "learning_rate": 7.926963741324511e-05, "loss": 0.0105, "step": 136120 }, { "epoch": 1.47, "learning_rate": 7.92534215476422e-05, "loss": 0.0084, "step": 136130 }, { "epoch": 1.47, "learning_rate": 7.923720568203931e-05, "loss": 0.0075, "step": 136140 }, { "epoch": 1.47, "learning_rate": 7.922098981643639e-05, "loss": 0.007, "step": 136150 }, { "epoch": 1.47, "learning_rate": 7.92047739508335e-05, "loss": 0.0124, "step": 136160 }, { "epoch": 1.47, "learning_rate": 7.918855808523058e-05, "loss": 0.0078, "step": 136170 }, { "epoch": 1.47, "learning_rate": 7.917234221962768e-05, "loss": 0.0108, "step": 136180 }, { "epoch": 1.47, "learning_rate": 7.915612635402476e-05, "loss": 0.0105, "step": 136190 }, { "epoch": 1.47, "learning_rate": 7.913991048842187e-05, "loss": 0.0077, "step": 136200 }, { "epoch": 1.47, "learning_rate": 7.912369462281896e-05, "loss": 0.0092, "step": 136210 }, { "epoch": 1.47, "learning_rate": 7.910747875721605e-05, "loss": 0.0075, "step": 136220 }, { "epoch": 1.47, "learning_rate": 7.909126289161315e-05, "loss": 0.0102, "step": 136230 }, { "epoch": 1.47, "learning_rate": 7.907504702601024e-05, "loss": 0.0095, "step": 136240 }, { "epoch": 1.47, "learning_rate": 7.905883116040733e-05, "loss": 0.0097, "step": 136250 }, { "epoch": 1.47, "learning_rate": 7.904261529480444e-05, "loss": 0.0104, "step": 136260 }, { "epoch": 1.47, "learning_rate": 7.902639942920152e-05, "loss": 0.0075, "step": 136270 }, { "epoch": 1.47, "learning_rate": 7.901018356359862e-05, "loss": 0.0083, "step": 136280 }, { "epoch": 1.47, "learning_rate": 7.89939676979957e-05, "loss": 0.0088, "step": 136290 }, { "epoch": 1.47, "learning_rate": 7.897775183239281e-05, "loss": 0.0081, "step": 136300 }, { "epoch": 1.47, "learning_rate": 7.89615359667899e-05, "loss": 0.0085, "step": 136310 }, { "epoch": 1.47, "learning_rate": 7.8945320101187e-05, "loss": 0.0063, "step": 136320 }, { "epoch": 1.47, "learning_rate": 7.892910423558409e-05, "loss": 0.0077, "step": 136330 }, { "epoch": 1.47, "learning_rate": 7.891288836998118e-05, "loss": 0.0101, "step": 136340 }, { "epoch": 1.47, "learning_rate": 7.889667250437827e-05, "loss": 0.0082, "step": 136350 }, { "epoch": 1.47, "learning_rate": 7.888045663877538e-05, "loss": 0.0083, "step": 136360 }, { "epoch": 1.47, "learning_rate": 7.886424077317246e-05, "loss": 0.0084, "step": 136370 }, { "epoch": 1.47, "learning_rate": 7.884802490756957e-05, "loss": 0.0064, "step": 136380 }, { "epoch": 1.47, "learning_rate": 7.883180904196664e-05, "loss": 0.0085, "step": 136390 }, { "epoch": 1.47, "learning_rate": 7.881559317636375e-05, "loss": 0.0085, "step": 136400 }, { "epoch": 1.47, "learning_rate": 7.879937731076083e-05, "loss": 0.0076, "step": 136410 }, { "epoch": 1.47, "learning_rate": 7.878316144515794e-05, "loss": 0.0087, "step": 136420 }, { "epoch": 1.47, "learning_rate": 7.876694557955503e-05, "loss": 0.0091, "step": 136430 }, { "epoch": 1.47, "learning_rate": 7.875072971395212e-05, "loss": 0.0075, "step": 136440 }, { "epoch": 1.48, "learning_rate": 7.873451384834921e-05, "loss": 0.0097, "step": 136450 }, { "epoch": 1.48, "learning_rate": 7.871829798274632e-05, "loss": 0.0088, "step": 136460 }, { "epoch": 1.48, "learning_rate": 7.87020821171434e-05, "loss": 0.0068, "step": 136470 }, { "epoch": 1.48, "learning_rate": 7.86858662515405e-05, "loss": 0.0094, "step": 136480 }, { "epoch": 1.48, "learning_rate": 7.866965038593759e-05, "loss": 0.0073, "step": 136490 }, { "epoch": 1.48, "learning_rate": 7.865343452033469e-05, "loss": 0.0087, "step": 136500 }, { "epoch": 1.48, "learning_rate": 7.863721865473177e-05, "loss": 0.0081, "step": 136510 }, { "epoch": 1.48, "learning_rate": 7.862100278912888e-05, "loss": 0.0101, "step": 136520 }, { "epoch": 1.48, "learning_rate": 7.860478692352597e-05, "loss": 0.0084, "step": 136530 }, { "epoch": 1.48, "learning_rate": 7.858857105792306e-05, "loss": 0.0099, "step": 136540 }, { "epoch": 1.48, "learning_rate": 7.857235519232016e-05, "loss": 0.0063, "step": 136550 }, { "epoch": 1.48, "learning_rate": 7.855613932671725e-05, "loss": 0.0073, "step": 136560 }, { "epoch": 1.48, "learning_rate": 7.853992346111434e-05, "loss": 0.0105, "step": 136570 }, { "epoch": 1.48, "learning_rate": 7.852370759551145e-05, "loss": 0.0068, "step": 136580 }, { "epoch": 1.48, "learning_rate": 7.850749172990853e-05, "loss": 0.0065, "step": 136590 }, { "epoch": 1.48, "learning_rate": 7.849127586430563e-05, "loss": 0.0088, "step": 136600 }, { "epoch": 1.48, "learning_rate": 7.847505999870271e-05, "loss": 0.0081, "step": 136610 }, { "epoch": 1.48, "learning_rate": 7.845884413309982e-05, "loss": 0.0073, "step": 136620 }, { "epoch": 1.48, "learning_rate": 7.84426282674969e-05, "loss": 0.006, "step": 136630 }, { "epoch": 1.48, "learning_rate": 7.8426412401894e-05, "loss": 0.0111, "step": 136640 }, { "epoch": 1.48, "learning_rate": 7.84101965362911e-05, "loss": 0.0086, "step": 136650 }, { "epoch": 1.48, "learning_rate": 7.839398067068819e-05, "loss": 0.01, "step": 136660 }, { "epoch": 1.48, "learning_rate": 7.83777648050853e-05, "loss": 0.0066, "step": 136670 }, { "epoch": 1.48, "learning_rate": 7.836154893948239e-05, "loss": 0.0095, "step": 136680 }, { "epoch": 1.48, "learning_rate": 7.834533307387948e-05, "loss": 0.0091, "step": 136690 }, { "epoch": 1.48, "learning_rate": 7.832911720827657e-05, "loss": 0.0061, "step": 136700 }, { "epoch": 1.48, "learning_rate": 7.831290134267367e-05, "loss": 0.009, "step": 136710 }, { "epoch": 1.48, "learning_rate": 7.829668547707076e-05, "loss": 0.0098, "step": 136720 }, { "epoch": 1.48, "learning_rate": 7.828046961146787e-05, "loss": 0.006, "step": 136730 }, { "epoch": 1.48, "learning_rate": 7.826425374586494e-05, "loss": 0.0089, "step": 136740 }, { "epoch": 1.48, "learning_rate": 7.824803788026205e-05, "loss": 0.0085, "step": 136750 }, { "epoch": 1.48, "learning_rate": 7.823182201465913e-05, "loss": 0.0089, "step": 136760 }, { "epoch": 1.48, "learning_rate": 7.821560614905624e-05, "loss": 0.009, "step": 136770 }, { "epoch": 1.48, "learning_rate": 7.819939028345332e-05, "loss": 0.0061, "step": 136780 }, { "epoch": 1.48, "learning_rate": 7.818317441785042e-05, "loss": 0.0098, "step": 136790 }, { "epoch": 1.48, "learning_rate": 7.816695855224752e-05, "loss": 0.0068, "step": 136800 }, { "epoch": 1.48, "learning_rate": 7.815074268664461e-05, "loss": 0.0061, "step": 136810 }, { "epoch": 1.48, "learning_rate": 7.81345268210417e-05, "loss": 0.0104, "step": 136820 }, { "epoch": 1.48, "learning_rate": 7.811831095543881e-05, "loss": 0.0081, "step": 136830 }, { "epoch": 1.48, "learning_rate": 7.810209508983589e-05, "loss": 0.0102, "step": 136840 }, { "epoch": 1.48, "learning_rate": 7.808587922423299e-05, "loss": 0.0066, "step": 136850 }, { "epoch": 1.48, "learning_rate": 7.806966335863007e-05, "loss": 0.0076, "step": 136860 }, { "epoch": 1.48, "learning_rate": 7.805344749302718e-05, "loss": 0.0074, "step": 136870 }, { "epoch": 1.48, "learning_rate": 7.803723162742426e-05, "loss": 0.0078, "step": 136880 }, { "epoch": 1.48, "learning_rate": 7.802101576182136e-05, "loss": 0.0085, "step": 136890 }, { "epoch": 1.48, "learning_rate": 7.800479989621846e-05, "loss": 0.0077, "step": 136900 }, { "epoch": 1.48, "learning_rate": 7.798858403061555e-05, "loss": 0.0069, "step": 136910 }, { "epoch": 1.48, "learning_rate": 7.797236816501264e-05, "loss": 0.0064, "step": 136920 }, { "epoch": 1.48, "learning_rate": 7.795615229940973e-05, "loss": 0.008, "step": 136930 }, { "epoch": 1.48, "learning_rate": 7.793993643380683e-05, "loss": 0.006, "step": 136940 }, { "epoch": 1.48, "learning_rate": 7.792372056820393e-05, "loss": 0.0094, "step": 136950 }, { "epoch": 1.48, "learning_rate": 7.790750470260101e-05, "loss": 0.008, "step": 136960 }, { "epoch": 1.48, "learning_rate": 7.789128883699812e-05, "loss": 0.0085, "step": 136970 }, { "epoch": 1.48, "learning_rate": 7.78750729713952e-05, "loss": 0.0067, "step": 136980 }, { "epoch": 1.48, "learning_rate": 7.78588571057923e-05, "loss": 0.0084, "step": 136990 }, { "epoch": 1.48, "learning_rate": 7.78426412401894e-05, "loss": 0.0083, "step": 137000 }, { "epoch": 1.48, "eval_cer": 0.9215529925977656, "eval_loss": 0.006497697904706001, "eval_runtime": 121.1874, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 137000 }, { "epoch": 1.48, "learning_rate": 7.782642537458649e-05, "loss": 0.0112, "step": 137010 }, { "epoch": 1.48, "learning_rate": 7.781020950898358e-05, "loss": 0.0082, "step": 137020 }, { "epoch": 1.48, "learning_rate": 7.779399364338068e-05, "loss": 0.0076, "step": 137030 }, { "epoch": 1.48, "learning_rate": 7.777777777777777e-05, "loss": 0.0078, "step": 137040 }, { "epoch": 1.48, "learning_rate": 7.776156191217487e-05, "loss": 0.0072, "step": 137050 }, { "epoch": 1.48, "learning_rate": 7.774534604657195e-05, "loss": 0.0086, "step": 137060 }, { "epoch": 1.48, "learning_rate": 7.772913018096906e-05, "loss": 0.0083, "step": 137070 }, { "epoch": 1.48, "learning_rate": 7.771291431536614e-05, "loss": 0.0063, "step": 137080 }, { "epoch": 1.48, "learning_rate": 7.769669844976325e-05, "loss": 0.0071, "step": 137090 }, { "epoch": 1.48, "learning_rate": 7.768048258416032e-05, "loss": 0.0081, "step": 137100 }, { "epoch": 1.48, "learning_rate": 7.766426671855743e-05, "loss": 0.0067, "step": 137110 }, { "epoch": 1.48, "learning_rate": 7.764805085295452e-05, "loss": 0.0079, "step": 137120 }, { "epoch": 1.48, "learning_rate": 7.763183498735162e-05, "loss": 0.0081, "step": 137130 }, { "epoch": 1.48, "learning_rate": 7.761561912174871e-05, "loss": 0.0082, "step": 137140 }, { "epoch": 1.48, "learning_rate": 7.759940325614582e-05, "loss": 0.0108, "step": 137150 }, { "epoch": 1.48, "learning_rate": 7.75831873905429e-05, "loss": 0.0097, "step": 137160 }, { "epoch": 1.48, "learning_rate": 7.756697152494e-05, "loss": 0.0098, "step": 137170 }, { "epoch": 1.48, "learning_rate": 7.755075565933708e-05, "loss": 0.0058, "step": 137180 }, { "epoch": 1.48, "learning_rate": 7.753453979373419e-05, "loss": 0.0072, "step": 137190 }, { "epoch": 1.48, "learning_rate": 7.751832392813127e-05, "loss": 0.0074, "step": 137200 }, { "epoch": 1.48, "learning_rate": 7.750210806252837e-05, "loss": 0.0077, "step": 137210 }, { "epoch": 1.48, "learning_rate": 7.748589219692546e-05, "loss": 0.0087, "step": 137220 }, { "epoch": 1.48, "learning_rate": 7.746967633132256e-05, "loss": 0.0105, "step": 137230 }, { "epoch": 1.48, "learning_rate": 7.745346046571965e-05, "loss": 0.0098, "step": 137240 }, { "epoch": 1.48, "learning_rate": 7.743724460011674e-05, "loss": 0.0068, "step": 137250 }, { "epoch": 1.48, "learning_rate": 7.742102873451384e-05, "loss": 0.0089, "step": 137260 }, { "epoch": 1.48, "learning_rate": 7.740481286891094e-05, "loss": 0.0059, "step": 137270 }, { "epoch": 1.48, "learning_rate": 7.738859700330802e-05, "loss": 0.0089, "step": 137280 }, { "epoch": 1.48, "learning_rate": 7.737238113770513e-05, "loss": 0.0099, "step": 137290 }, { "epoch": 1.48, "learning_rate": 7.73561652721022e-05, "loss": 0.0106, "step": 137300 }, { "epoch": 1.48, "learning_rate": 7.733994940649931e-05, "loss": 0.0075, "step": 137310 }, { "epoch": 1.48, "learning_rate": 7.73237335408964e-05, "loss": 0.0107, "step": 137320 }, { "epoch": 1.48, "learning_rate": 7.73075176752935e-05, "loss": 0.0081, "step": 137330 }, { "epoch": 1.48, "learning_rate": 7.729130180969059e-05, "loss": 0.0118, "step": 137340 }, { "epoch": 1.48, "learning_rate": 7.727508594408768e-05, "loss": 0.0097, "step": 137350 }, { "epoch": 1.48, "learning_rate": 7.725887007848478e-05, "loss": 0.0085, "step": 137360 }, { "epoch": 1.49, "learning_rate": 7.724265421288188e-05, "loss": 0.0104, "step": 137370 }, { "epoch": 1.49, "learning_rate": 7.722643834727896e-05, "loss": 0.0084, "step": 137380 }, { "epoch": 1.49, "learning_rate": 7.721022248167607e-05, "loss": 0.0086, "step": 137390 }, { "epoch": 1.49, "learning_rate": 7.719400661607316e-05, "loss": 0.0071, "step": 137400 }, { "epoch": 1.49, "learning_rate": 7.717779075047025e-05, "loss": 0.007, "step": 137410 }, { "epoch": 1.49, "learning_rate": 7.716157488486736e-05, "loss": 0.0083, "step": 137420 }, { "epoch": 1.49, "learning_rate": 7.714535901926444e-05, "loss": 0.0078, "step": 137430 }, { "epoch": 1.49, "learning_rate": 7.712914315366155e-05, "loss": 0.008, "step": 137440 }, { "epoch": 1.49, "learning_rate": 7.711292728805862e-05, "loss": 0.0081, "step": 137450 }, { "epoch": 1.49, "learning_rate": 7.709671142245573e-05, "loss": 0.0076, "step": 137460 }, { "epoch": 1.49, "learning_rate": 7.708049555685282e-05, "loss": 0.0068, "step": 137470 }, { "epoch": 1.49, "learning_rate": 7.706427969124992e-05, "loss": 0.0072, "step": 137480 }, { "epoch": 1.49, "learning_rate": 7.704806382564701e-05, "loss": 0.0092, "step": 137490 }, { "epoch": 1.49, "learning_rate": 7.70318479600441e-05, "loss": 0.0092, "step": 137500 }, { "epoch": 1.49, "learning_rate": 7.70156320944412e-05, "loss": 0.0081, "step": 137510 }, { "epoch": 1.49, "learning_rate": 7.69994162288383e-05, "loss": 0.0081, "step": 137520 }, { "epoch": 1.49, "learning_rate": 7.698320036323538e-05, "loss": 0.0093, "step": 137530 }, { "epoch": 1.49, "learning_rate": 7.696698449763249e-05, "loss": 0.0068, "step": 137540 }, { "epoch": 1.49, "learning_rate": 7.695076863202957e-05, "loss": 0.0088, "step": 137550 }, { "epoch": 1.49, "learning_rate": 7.693455276642667e-05, "loss": 0.0107, "step": 137560 }, { "epoch": 1.49, "learning_rate": 7.691833690082375e-05, "loss": 0.0091, "step": 137570 }, { "epoch": 1.49, "learning_rate": 7.690212103522086e-05, "loss": 0.0086, "step": 137580 }, { "epoch": 1.49, "learning_rate": 7.688590516961795e-05, "loss": 0.0076, "step": 137590 }, { "epoch": 1.49, "learning_rate": 7.686968930401504e-05, "loss": 0.0073, "step": 137600 }, { "epoch": 1.49, "learning_rate": 7.685347343841214e-05, "loss": 0.0078, "step": 137610 }, { "epoch": 1.49, "learning_rate": 7.683725757280924e-05, "loss": 0.0083, "step": 137620 }, { "epoch": 1.49, "learning_rate": 7.682104170720632e-05, "loss": 0.0074, "step": 137630 }, { "epoch": 1.49, "learning_rate": 7.680482584160343e-05, "loss": 0.0092, "step": 137640 }, { "epoch": 1.49, "learning_rate": 7.67886099760005e-05, "loss": 0.0103, "step": 137650 }, { "epoch": 1.49, "learning_rate": 7.677239411039761e-05, "loss": 0.0065, "step": 137660 }, { "epoch": 1.49, "learning_rate": 7.675617824479469e-05, "loss": 0.0072, "step": 137670 }, { "epoch": 1.49, "learning_rate": 7.67399623791918e-05, "loss": 0.0076, "step": 137680 }, { "epoch": 1.49, "learning_rate": 7.672374651358889e-05, "loss": 0.0099, "step": 137690 }, { "epoch": 1.49, "learning_rate": 7.670753064798598e-05, "loss": 0.0107, "step": 137700 }, { "epoch": 1.49, "learning_rate": 7.669131478238308e-05, "loss": 0.0055, "step": 137710 }, { "epoch": 1.49, "learning_rate": 7.667509891678017e-05, "loss": 0.0079, "step": 137720 }, { "epoch": 1.49, "learning_rate": 7.665888305117726e-05, "loss": 0.0083, "step": 137730 }, { "epoch": 1.49, "learning_rate": 7.664266718557437e-05, "loss": 0.008, "step": 137740 }, { "epoch": 1.49, "learning_rate": 7.662645131997145e-05, "loss": 0.0085, "step": 137750 }, { "epoch": 1.49, "learning_rate": 7.661023545436855e-05, "loss": 0.0084, "step": 137760 }, { "epoch": 1.49, "learning_rate": 7.659401958876563e-05, "loss": 0.0086, "step": 137770 }, { "epoch": 1.49, "learning_rate": 7.657780372316274e-05, "loss": 0.0081, "step": 137780 }, { "epoch": 1.49, "learning_rate": 7.656158785755982e-05, "loss": 0.0081, "step": 137790 }, { "epoch": 1.49, "learning_rate": 7.654537199195692e-05, "loss": 0.0081, "step": 137800 }, { "epoch": 1.49, "learning_rate": 7.652915612635402e-05, "loss": 0.0077, "step": 137810 }, { "epoch": 1.49, "learning_rate": 7.651294026075111e-05, "loss": 0.0079, "step": 137820 }, { "epoch": 1.49, "learning_rate": 7.64967243951482e-05, "loss": 0.0074, "step": 137830 }, { "epoch": 1.49, "learning_rate": 7.648050852954531e-05, "loss": 0.0076, "step": 137840 }, { "epoch": 1.49, "learning_rate": 7.646429266394239e-05, "loss": 0.0077, "step": 137850 }, { "epoch": 1.49, "learning_rate": 7.64480767983395e-05, "loss": 0.0071, "step": 137860 }, { "epoch": 1.49, "learning_rate": 7.643186093273657e-05, "loss": 0.0067, "step": 137870 }, { "epoch": 1.49, "learning_rate": 7.641564506713368e-05, "loss": 0.0062, "step": 137880 }, { "epoch": 1.49, "learning_rate": 7.639942920153076e-05, "loss": 0.0085, "step": 137890 }, { "epoch": 1.49, "learning_rate": 7.638321333592787e-05, "loss": 0.0099, "step": 137900 }, { "epoch": 1.49, "learning_rate": 7.636699747032496e-05, "loss": 0.0084, "step": 137910 }, { "epoch": 1.49, "learning_rate": 7.635078160472205e-05, "loss": 0.0071, "step": 137920 }, { "epoch": 1.49, "learning_rate": 7.633456573911914e-05, "loss": 0.0068, "step": 137930 }, { "epoch": 1.49, "learning_rate": 7.631834987351624e-05, "loss": 0.0077, "step": 137940 }, { "epoch": 1.49, "learning_rate": 7.630213400791333e-05, "loss": 0.01, "step": 137950 }, { "epoch": 1.49, "learning_rate": 7.628591814231044e-05, "loss": 0.0115, "step": 137960 }, { "epoch": 1.49, "learning_rate": 7.626970227670752e-05, "loss": 0.0085, "step": 137970 }, { "epoch": 1.49, "learning_rate": 7.625348641110462e-05, "loss": 0.009, "step": 137980 }, { "epoch": 1.49, "learning_rate": 7.62372705455017e-05, "loss": 0.0097, "step": 137990 }, { "epoch": 1.49, "learning_rate": 7.622105467989881e-05, "loss": 0.0108, "step": 138000 }, { "epoch": 1.49, "eval_cer": 0.9215364891415945, "eval_loss": 0.006428159307688475, "eval_runtime": 121.4519, "eval_samples_per_second": 16.467, "eval_steps_per_second": 4.117, "step": 138000 }, { "epoch": 1.49, "learning_rate": 7.62048388142959e-05, "loss": 0.0076, "step": 138010 }, { "epoch": 1.49, "learning_rate": 7.618862294869299e-05, "loss": 0.007, "step": 138020 }, { "epoch": 1.49, "learning_rate": 7.617240708309009e-05, "loss": 0.0083, "step": 138030 }, { "epoch": 1.49, "learning_rate": 7.615619121748718e-05, "loss": 0.0072, "step": 138040 }, { "epoch": 1.49, "learning_rate": 7.613997535188427e-05, "loss": 0.0084, "step": 138050 }, { "epoch": 1.49, "learning_rate": 7.612375948628138e-05, "loss": 0.011, "step": 138060 }, { "epoch": 1.49, "learning_rate": 7.610754362067846e-05, "loss": 0.0076, "step": 138070 }, { "epoch": 1.49, "learning_rate": 7.609132775507556e-05, "loss": 0.0079, "step": 138080 }, { "epoch": 1.49, "learning_rate": 7.607511188947264e-05, "loss": 0.0068, "step": 138090 }, { "epoch": 1.49, "learning_rate": 7.605889602386975e-05, "loss": 0.0075, "step": 138100 }, { "epoch": 1.49, "learning_rate": 7.604268015826685e-05, "loss": 0.0087, "step": 138110 }, { "epoch": 1.49, "learning_rate": 7.602646429266393e-05, "loss": 0.0095, "step": 138120 }, { "epoch": 1.49, "learning_rate": 7.601024842706104e-05, "loss": 0.0079, "step": 138130 }, { "epoch": 1.49, "learning_rate": 7.599403256145812e-05, "loss": 0.0086, "step": 138140 }, { "epoch": 1.49, "learning_rate": 7.597781669585523e-05, "loss": 0.0065, "step": 138150 }, { "epoch": 1.49, "learning_rate": 7.596160083025232e-05, "loss": 0.0064, "step": 138160 }, { "epoch": 1.49, "learning_rate": 7.594538496464941e-05, "loss": 0.0084, "step": 138170 }, { "epoch": 1.49, "learning_rate": 7.59291690990465e-05, "loss": 0.0104, "step": 138180 }, { "epoch": 1.49, "learning_rate": 7.59129532334436e-05, "loss": 0.0064, "step": 138190 }, { "epoch": 1.49, "learning_rate": 7.589673736784069e-05, "loss": 0.0085, "step": 138200 }, { "epoch": 1.49, "learning_rate": 7.58805215022378e-05, "loss": 0.0077, "step": 138210 }, { "epoch": 1.49, "learning_rate": 7.586430563663487e-05, "loss": 0.0106, "step": 138220 }, { "epoch": 1.49, "learning_rate": 7.584808977103198e-05, "loss": 0.0066, "step": 138230 }, { "epoch": 1.49, "learning_rate": 7.583187390542906e-05, "loss": 0.0087, "step": 138240 }, { "epoch": 1.49, "learning_rate": 7.581565803982617e-05, "loss": 0.0079, "step": 138250 }, { "epoch": 1.49, "learning_rate": 7.579944217422325e-05, "loss": 0.008, "step": 138260 }, { "epoch": 1.49, "learning_rate": 7.578322630862035e-05, "loss": 0.0076, "step": 138270 }, { "epoch": 1.49, "learning_rate": 7.576701044301744e-05, "loss": 0.0082, "step": 138280 }, { "epoch": 1.49, "learning_rate": 7.575079457741454e-05, "loss": 0.0102, "step": 138290 }, { "epoch": 1.5, "learning_rate": 7.573457871181163e-05, "loss": 0.0077, "step": 138300 }, { "epoch": 1.5, "learning_rate": 7.571836284620874e-05, "loss": 0.0056, "step": 138310 }, { "epoch": 1.5, "learning_rate": 7.570214698060582e-05, "loss": 0.009, "step": 138320 }, { "epoch": 1.5, "learning_rate": 7.568593111500292e-05, "loss": 0.0089, "step": 138330 }, { "epoch": 1.5, "learning_rate": 7.56697152494e-05, "loss": 0.0094, "step": 138340 }, { "epoch": 1.5, "learning_rate": 7.565349938379711e-05, "loss": 0.0077, "step": 138350 }, { "epoch": 1.5, "learning_rate": 7.563728351819419e-05, "loss": 0.0086, "step": 138360 }, { "epoch": 1.5, "learning_rate": 7.562106765259129e-05, "loss": 0.01, "step": 138370 }, { "epoch": 1.5, "learning_rate": 7.560485178698839e-05, "loss": 0.0072, "step": 138380 }, { "epoch": 1.5, "learning_rate": 7.558863592138548e-05, "loss": 0.0067, "step": 138390 }, { "epoch": 1.5, "learning_rate": 7.557242005578257e-05, "loss": 0.0083, "step": 138400 }, { "epoch": 1.5, "learning_rate": 7.555620419017966e-05, "loss": 0.008, "step": 138410 }, { "epoch": 1.5, "learning_rate": 7.553998832457676e-05, "loss": 0.0092, "step": 138420 }, { "epoch": 1.5, "learning_rate": 7.552377245897386e-05, "loss": 0.0084, "step": 138430 }, { "epoch": 1.5, "learning_rate": 7.550755659337094e-05, "loss": 0.0086, "step": 138440 }, { "epoch": 1.5, "learning_rate": 7.549134072776805e-05, "loss": 0.01, "step": 138450 }, { "epoch": 1.5, "learning_rate": 7.547512486216513e-05, "loss": 0.01, "step": 138460 }, { "epoch": 1.5, "learning_rate": 7.545890899656223e-05, "loss": 0.0075, "step": 138470 }, { "epoch": 1.5, "learning_rate": 7.544269313095933e-05, "loss": 0.0068, "step": 138480 }, { "epoch": 1.5, "learning_rate": 7.542647726535642e-05, "loss": 0.0079, "step": 138490 }, { "epoch": 1.5, "learning_rate": 7.541026139975351e-05, "loss": 0.0099, "step": 138500 }, { "epoch": 1.5, "learning_rate": 7.53940455341506e-05, "loss": 0.0088, "step": 138510 }, { "epoch": 1.5, "learning_rate": 7.53778296685477e-05, "loss": 0.0086, "step": 138520 }, { "epoch": 1.5, "learning_rate": 7.53616138029448e-05, "loss": 0.0063, "step": 138530 }, { "epoch": 1.5, "learning_rate": 7.534539793734188e-05, "loss": 0.0097, "step": 138540 }, { "epoch": 1.5, "learning_rate": 7.532918207173899e-05, "loss": 0.0105, "step": 138550 }, { "epoch": 1.5, "learning_rate": 7.531296620613607e-05, "loss": 0.0076, "step": 138560 }, { "epoch": 1.5, "learning_rate": 7.529675034053317e-05, "loss": 0.0074, "step": 138570 }, { "epoch": 1.5, "learning_rate": 7.528053447493025e-05, "loss": 0.008, "step": 138580 }, { "epoch": 1.5, "learning_rate": 7.526431860932736e-05, "loss": 0.0094, "step": 138590 }, { "epoch": 1.5, "learning_rate": 7.524810274372445e-05, "loss": 0.0083, "step": 138600 }, { "epoch": 1.5, "learning_rate": 7.523188687812155e-05, "loss": 0.0073, "step": 138610 }, { "epoch": 1.5, "learning_rate": 7.521567101251864e-05, "loss": 0.0081, "step": 138620 }, { "epoch": 1.5, "learning_rate": 7.519945514691574e-05, "loss": 0.0103, "step": 138630 }, { "epoch": 1.5, "learning_rate": 7.518323928131282e-05, "loss": 0.0078, "step": 138640 }, { "epoch": 1.5, "learning_rate": 7.516702341570993e-05, "loss": 0.0084, "step": 138650 }, { "epoch": 1.5, "learning_rate": 7.515080755010701e-05, "loss": 0.0088, "step": 138660 }, { "epoch": 1.5, "learning_rate": 7.513459168450412e-05, "loss": 0.0077, "step": 138670 }, { "epoch": 1.5, "learning_rate": 7.51183758189012e-05, "loss": 0.0075, "step": 138680 }, { "epoch": 1.5, "learning_rate": 7.51021599532983e-05, "loss": 0.0073, "step": 138690 }, { "epoch": 1.5, "learning_rate": 7.50859440876954e-05, "loss": 0.0085, "step": 138700 }, { "epoch": 1.5, "learning_rate": 7.506972822209249e-05, "loss": 0.0082, "step": 138710 }, { "epoch": 1.5, "learning_rate": 7.505351235648958e-05, "loss": 0.0077, "step": 138720 }, { "epoch": 1.5, "learning_rate": 7.503729649088667e-05, "loss": 0.0075, "step": 138730 }, { "epoch": 1.5, "learning_rate": 7.502108062528376e-05, "loss": 0.0054, "step": 138740 }, { "epoch": 1.5, "learning_rate": 7.500486475968087e-05, "loss": 0.0068, "step": 138750 }, { "epoch": 1.5, "learning_rate": 7.498864889407796e-05, "loss": 0.0118, "step": 138760 }, { "epoch": 1.5, "learning_rate": 7.497243302847506e-05, "loss": 0.0075, "step": 138770 }, { "epoch": 1.5, "learning_rate": 7.495621716287215e-05, "loss": 0.0091, "step": 138780 }, { "epoch": 1.5, "learning_rate": 7.494000129726924e-05, "loss": 0.0067, "step": 138790 }, { "epoch": 1.5, "learning_rate": 7.492378543166633e-05, "loss": 0.0068, "step": 138800 }, { "epoch": 1.5, "learning_rate": 7.490756956606343e-05, "loss": 0.0077, "step": 138810 }, { "epoch": 1.5, "learning_rate": 7.489135370046052e-05, "loss": 0.012, "step": 138820 }, { "epoch": 1.5, "learning_rate": 7.487513783485761e-05, "loss": 0.0065, "step": 138830 }, { "epoch": 1.5, "learning_rate": 7.48589219692547e-05, "loss": 0.0071, "step": 138840 }, { "epoch": 1.5, "learning_rate": 7.484270610365181e-05, "loss": 0.0077, "step": 138850 }, { "epoch": 1.5, "learning_rate": 7.48264902380489e-05, "loss": 0.0075, "step": 138860 }, { "epoch": 1.5, "learning_rate": 7.4810274372446e-05, "loss": 0.0102, "step": 138870 }, { "epoch": 1.5, "learning_rate": 7.479405850684309e-05, "loss": 0.0072, "step": 138880 }, { "epoch": 1.5, "learning_rate": 7.477784264124018e-05, "loss": 0.0069, "step": 138890 }, { "epoch": 1.5, "learning_rate": 7.476162677563728e-05, "loss": 0.0073, "step": 138900 }, { "epoch": 1.5, "learning_rate": 7.474541091003437e-05, "loss": 0.0069, "step": 138910 }, { "epoch": 1.5, "learning_rate": 7.472919504443146e-05, "loss": 0.0089, "step": 138920 }, { "epoch": 1.5, "learning_rate": 7.471297917882855e-05, "loss": 0.009, "step": 138930 }, { "epoch": 1.5, "learning_rate": 7.469676331322565e-05, "loss": 0.0064, "step": 138940 }, { "epoch": 1.5, "learning_rate": 7.468054744762274e-05, "loss": 0.0068, "step": 138950 }, { "epoch": 1.5, "learning_rate": 7.466433158201985e-05, "loss": 0.0078, "step": 138960 }, { "epoch": 1.5, "learning_rate": 7.464811571641694e-05, "loss": 0.008, "step": 138970 }, { "epoch": 1.5, "learning_rate": 7.463189985081403e-05, "loss": 0.0074, "step": 138980 }, { "epoch": 1.5, "learning_rate": 7.461568398521112e-05, "loss": 0.0069, "step": 138990 }, { "epoch": 1.5, "learning_rate": 7.459946811960822e-05, "loss": 0.0074, "step": 139000 }, { "epoch": 1.5, "eval_cer": 0.9215234600972488, "eval_loss": 0.006560348439961672, "eval_runtime": 121.2617, "eval_samples_per_second": 16.493, "eval_steps_per_second": 4.123, "step": 139000 }, { "epoch": 1.5, "learning_rate": 7.458325225400531e-05, "loss": 0.0064, "step": 139010 }, { "epoch": 1.5, "learning_rate": 7.45670363884024e-05, "loss": 0.008, "step": 139020 }, { "epoch": 1.5, "learning_rate": 7.45508205227995e-05, "loss": 0.0058, "step": 139030 }, { "epoch": 1.5, "learning_rate": 7.453460465719659e-05, "loss": 0.0083, "step": 139040 }, { "epoch": 1.5, "learning_rate": 7.451838879159368e-05, "loss": 0.0083, "step": 139050 }, { "epoch": 1.5, "learning_rate": 7.450217292599079e-05, "loss": 0.0074, "step": 139060 }, { "epoch": 1.5, "learning_rate": 7.448595706038788e-05, "loss": 0.008, "step": 139070 }, { "epoch": 1.5, "learning_rate": 7.446974119478497e-05, "loss": 0.008, "step": 139080 }, { "epoch": 1.5, "learning_rate": 7.445352532918206e-05, "loss": 0.0098, "step": 139090 }, { "epoch": 1.5, "learning_rate": 7.443730946357916e-05, "loss": 0.0082, "step": 139100 }, { "epoch": 1.5, "learning_rate": 7.442109359797625e-05, "loss": 0.0074, "step": 139110 }, { "epoch": 1.5, "learning_rate": 7.440487773237334e-05, "loss": 0.0076, "step": 139120 }, { "epoch": 1.5, "learning_rate": 7.438866186677044e-05, "loss": 0.008, "step": 139130 }, { "epoch": 1.5, "learning_rate": 7.437244600116753e-05, "loss": 0.0095, "step": 139140 }, { "epoch": 1.5, "learning_rate": 7.435623013556462e-05, "loss": 0.0076, "step": 139150 }, { "epoch": 1.5, "learning_rate": 7.434001426996171e-05, "loss": 0.0124, "step": 139160 }, { "epoch": 1.5, "learning_rate": 7.432379840435882e-05, "loss": 0.0109, "step": 139170 }, { "epoch": 1.5, "learning_rate": 7.430758253875591e-05, "loss": 0.0076, "step": 139180 }, { "epoch": 1.5, "learning_rate": 7.4291366673153e-05, "loss": 0.0087, "step": 139190 }, { "epoch": 1.5, "learning_rate": 7.42751508075501e-05, "loss": 0.0092, "step": 139200 }, { "epoch": 1.5, "learning_rate": 7.42589349419472e-05, "loss": 0.0092, "step": 139210 }, { "epoch": 1.51, "learning_rate": 7.42427190763443e-05, "loss": 0.0086, "step": 139220 }, { "epoch": 1.51, "learning_rate": 7.422650321074139e-05, "loss": 0.0069, "step": 139230 }, { "epoch": 1.51, "learning_rate": 7.421028734513848e-05, "loss": 0.0101, "step": 139240 }, { "epoch": 1.51, "learning_rate": 7.419407147953558e-05, "loss": 0.0106, "step": 139250 }, { "epoch": 1.51, "learning_rate": 7.417785561393267e-05, "loss": 0.0099, "step": 139260 }, { "epoch": 1.51, "learning_rate": 7.416163974832976e-05, "loss": 0.0084, "step": 139270 }, { "epoch": 1.51, "learning_rate": 7.414542388272685e-05, "loss": 0.008, "step": 139280 }, { "epoch": 1.51, "learning_rate": 7.412920801712395e-05, "loss": 0.0068, "step": 139290 }, { "epoch": 1.51, "learning_rate": 7.411299215152104e-05, "loss": 0.0068, "step": 139300 }, { "epoch": 1.51, "learning_rate": 7.409677628591813e-05, "loss": 0.0072, "step": 139310 }, { "epoch": 1.51, "learning_rate": 7.408056042031524e-05, "loss": 0.0077, "step": 139320 }, { "epoch": 1.51, "learning_rate": 7.406434455471233e-05, "loss": 0.0079, "step": 139330 }, { "epoch": 1.51, "learning_rate": 7.404812868910942e-05, "loss": 0.0084, "step": 139340 }, { "epoch": 1.51, "learning_rate": 7.403191282350652e-05, "loss": 0.0072, "step": 139350 }, { "epoch": 1.51, "learning_rate": 7.401569695790361e-05, "loss": 0.0079, "step": 139360 }, { "epoch": 1.51, "learning_rate": 7.39994810923007e-05, "loss": 0.0061, "step": 139370 }, { "epoch": 1.51, "learning_rate": 7.39832652266978e-05, "loss": 0.0076, "step": 139380 }, { "epoch": 1.51, "learning_rate": 7.396704936109489e-05, "loss": 0.0071, "step": 139390 }, { "epoch": 1.51, "learning_rate": 7.395083349549198e-05, "loss": 0.0066, "step": 139400 }, { "epoch": 1.51, "learning_rate": 7.393461762988907e-05, "loss": 0.006, "step": 139410 }, { "epoch": 1.51, "learning_rate": 7.391840176428617e-05, "loss": 0.008, "step": 139420 }, { "epoch": 1.51, "learning_rate": 7.390218589868327e-05, "loss": 0.0116, "step": 139430 }, { "epoch": 1.51, "learning_rate": 7.388597003308037e-05, "loss": 0.0082, "step": 139440 }, { "epoch": 1.51, "learning_rate": 7.386975416747746e-05, "loss": 0.0067, "step": 139450 }, { "epoch": 1.51, "learning_rate": 7.385353830187455e-05, "loss": 0.0069, "step": 139460 }, { "epoch": 1.51, "learning_rate": 7.383732243627164e-05, "loss": 0.0092, "step": 139470 }, { "epoch": 1.51, "learning_rate": 7.382110657066874e-05, "loss": 0.0087, "step": 139480 }, { "epoch": 1.51, "learning_rate": 7.380489070506583e-05, "loss": 0.0091, "step": 139490 }, { "epoch": 1.51, "learning_rate": 7.378867483946292e-05, "loss": 0.0075, "step": 139500 }, { "epoch": 1.51, "learning_rate": 7.377245897386001e-05, "loss": 0.01, "step": 139510 }, { "epoch": 1.51, "learning_rate": 7.375624310825711e-05, "loss": 0.0071, "step": 139520 }, { "epoch": 1.51, "learning_rate": 7.37400272426542e-05, "loss": 0.0103, "step": 139530 }, { "epoch": 1.51, "learning_rate": 7.37238113770513e-05, "loss": 0.0099, "step": 139540 }, { "epoch": 1.51, "learning_rate": 7.37075955114484e-05, "loss": 0.0088, "step": 139550 }, { "epoch": 1.51, "learning_rate": 7.369137964584549e-05, "loss": 0.009, "step": 139560 }, { "epoch": 1.51, "learning_rate": 7.367516378024258e-05, "loss": 0.0063, "step": 139570 }, { "epoch": 1.51, "learning_rate": 7.365894791463968e-05, "loss": 0.0097, "step": 139580 }, { "epoch": 1.51, "learning_rate": 7.364273204903677e-05, "loss": 0.0067, "step": 139590 }, { "epoch": 1.51, "learning_rate": 7.362651618343386e-05, "loss": 0.0065, "step": 139600 }, { "epoch": 1.51, "learning_rate": 7.361030031783096e-05, "loss": 0.0074, "step": 139610 }, { "epoch": 1.51, "learning_rate": 7.359408445222805e-05, "loss": 0.0095, "step": 139620 }, { "epoch": 1.51, "learning_rate": 7.357786858662514e-05, "loss": 0.0102, "step": 139630 }, { "epoch": 1.51, "learning_rate": 7.356165272102225e-05, "loss": 0.0092, "step": 139640 }, { "epoch": 1.51, "learning_rate": 7.354543685541934e-05, "loss": 0.0089, "step": 139650 }, { "epoch": 1.51, "learning_rate": 7.352922098981643e-05, "loss": 0.0065, "step": 139660 }, { "epoch": 1.51, "learning_rate": 7.351300512421353e-05, "loss": 0.0078, "step": 139670 }, { "epoch": 1.51, "learning_rate": 7.349678925861062e-05, "loss": 0.0082, "step": 139680 }, { "epoch": 1.51, "learning_rate": 7.348057339300771e-05, "loss": 0.0068, "step": 139690 }, { "epoch": 1.51, "learning_rate": 7.34643575274048e-05, "loss": 0.0093, "step": 139700 }, { "epoch": 1.51, "learning_rate": 7.34481416618019e-05, "loss": 0.0077, "step": 139710 }, { "epoch": 1.51, "learning_rate": 7.343192579619899e-05, "loss": 0.009, "step": 139720 }, { "epoch": 1.51, "learning_rate": 7.341570993059608e-05, "loss": 0.0086, "step": 139730 }, { "epoch": 1.51, "learning_rate": 7.339949406499317e-05, "loss": 0.008, "step": 139740 }, { "epoch": 1.51, "learning_rate": 7.338327819939028e-05, "loss": 0.0083, "step": 139750 }, { "epoch": 1.51, "learning_rate": 7.336706233378737e-05, "loss": 0.0067, "step": 139760 }, { "epoch": 1.51, "learning_rate": 7.335084646818447e-05, "loss": 0.0089, "step": 139770 }, { "epoch": 1.51, "learning_rate": 7.333463060258156e-05, "loss": 0.0063, "step": 139780 }, { "epoch": 1.51, "learning_rate": 7.331841473697865e-05, "loss": 0.0098, "step": 139790 }, { "epoch": 1.51, "learning_rate": 7.330219887137574e-05, "loss": 0.0085, "step": 139800 }, { "epoch": 1.51, "learning_rate": 7.328598300577284e-05, "loss": 0.0096, "step": 139810 }, { "epoch": 1.51, "learning_rate": 7.326976714016993e-05, "loss": 0.0079, "step": 139820 }, { "epoch": 1.51, "learning_rate": 7.325355127456702e-05, "loss": 0.007, "step": 139830 }, { "epoch": 1.51, "learning_rate": 7.323733540896412e-05, "loss": 0.0068, "step": 139840 }, { "epoch": 1.51, "learning_rate": 7.322111954336121e-05, "loss": 0.0065, "step": 139850 }, { "epoch": 1.51, "learning_rate": 7.320490367775831e-05, "loss": 0.0098, "step": 139860 }, { "epoch": 1.51, "learning_rate": 7.318868781215541e-05, "loss": 0.008, "step": 139870 }, { "epoch": 1.51, "learning_rate": 7.31724719465525e-05, "loss": 0.0072, "step": 139880 }, { "epoch": 1.51, "learning_rate": 7.315625608094959e-05, "loss": 0.0078, "step": 139890 }, { "epoch": 1.51, "learning_rate": 7.314004021534669e-05, "loss": 0.0101, "step": 139900 }, { "epoch": 1.51, "learning_rate": 7.312382434974379e-05, "loss": 0.0074, "step": 139910 }, { "epoch": 1.51, "learning_rate": 7.310760848414088e-05, "loss": 0.0082, "step": 139920 }, { "epoch": 1.51, "learning_rate": 7.309139261853798e-05, "loss": 0.0114, "step": 139930 }, { "epoch": 1.51, "learning_rate": 7.307517675293507e-05, "loss": 0.0082, "step": 139940 }, { "epoch": 1.51, "learning_rate": 7.305896088733216e-05, "loss": 0.0084, "step": 139950 }, { "epoch": 1.51, "learning_rate": 7.304274502172926e-05, "loss": 0.008, "step": 139960 }, { "epoch": 1.51, "learning_rate": 7.302652915612635e-05, "loss": 0.0081, "step": 139970 }, { "epoch": 1.51, "learning_rate": 7.301031329052344e-05, "loss": 0.0077, "step": 139980 }, { "epoch": 1.51, "learning_rate": 7.299409742492053e-05, "loss": 0.0112, "step": 139990 }, { "epoch": 1.51, "learning_rate": 7.297788155931763e-05, "loss": 0.009, "step": 140000 }, { "epoch": 1.51, "eval_cer": 0.9215503867888964, "eval_loss": 0.006375947035849094, "eval_runtime": 121.158, "eval_samples_per_second": 16.507, "eval_steps_per_second": 4.127, "step": 140000 }, { "epoch": 1.51, "learning_rate": 7.296166569371473e-05, "loss": 0.0093, "step": 140010 }, { "epoch": 1.51, "learning_rate": 7.294544982811183e-05, "loss": 0.0071, "step": 140020 }, { "epoch": 1.51, "learning_rate": 7.292923396250892e-05, "loss": 0.0079, "step": 140030 }, { "epoch": 1.51, "learning_rate": 7.291301809690601e-05, "loss": 0.0084, "step": 140040 }, { "epoch": 1.51, "learning_rate": 7.28968022313031e-05, "loss": 0.0067, "step": 140050 }, { "epoch": 1.51, "learning_rate": 7.28805863657002e-05, "loss": 0.0111, "step": 140060 }, { "epoch": 1.51, "learning_rate": 7.286437050009729e-05, "loss": 0.0074, "step": 140070 }, { "epoch": 1.51, "learning_rate": 7.284815463449438e-05, "loss": 0.0077, "step": 140080 }, { "epoch": 1.51, "learning_rate": 7.283193876889147e-05, "loss": 0.0094, "step": 140090 }, { "epoch": 1.51, "learning_rate": 7.281572290328857e-05, "loss": 0.0067, "step": 140100 }, { "epoch": 1.51, "learning_rate": 7.279950703768566e-05, "loss": 0.0093, "step": 140110 }, { "epoch": 1.51, "learning_rate": 7.278329117208277e-05, "loss": 0.0073, "step": 140120 }, { "epoch": 1.51, "learning_rate": 7.276707530647986e-05, "loss": 0.0068, "step": 140130 }, { "epoch": 1.51, "learning_rate": 7.275085944087695e-05, "loss": 0.0066, "step": 140140 }, { "epoch": 1.52, "learning_rate": 7.273464357527404e-05, "loss": 0.0105, "step": 140150 }, { "epoch": 1.52, "learning_rate": 7.271842770967114e-05, "loss": 0.0084, "step": 140160 }, { "epoch": 1.52, "learning_rate": 7.270221184406823e-05, "loss": 0.0062, "step": 140170 }, { "epoch": 1.52, "learning_rate": 7.268599597846532e-05, "loss": 0.0084, "step": 140180 }, { "epoch": 1.52, "learning_rate": 7.266978011286242e-05, "loss": 0.0064, "step": 140190 }, { "epoch": 1.52, "learning_rate": 7.265356424725951e-05, "loss": 0.0103, "step": 140200 }, { "epoch": 1.52, "learning_rate": 7.26373483816566e-05, "loss": 0.0096, "step": 140210 }, { "epoch": 1.52, "learning_rate": 7.262113251605371e-05, "loss": 0.0063, "step": 140220 }, { "epoch": 1.52, "learning_rate": 7.26049166504508e-05, "loss": 0.0081, "step": 140230 }, { "epoch": 1.52, "learning_rate": 7.258870078484789e-05, "loss": 0.0075, "step": 140240 }, { "epoch": 1.52, "learning_rate": 7.257248491924499e-05, "loss": 0.0094, "step": 140250 }, { "epoch": 1.52, "learning_rate": 7.255626905364208e-05, "loss": 0.0067, "step": 140260 }, { "epoch": 1.52, "learning_rate": 7.254005318803917e-05, "loss": 0.0073, "step": 140270 }, { "epoch": 1.52, "learning_rate": 7.252383732243626e-05, "loss": 0.0087, "step": 140280 }, { "epoch": 1.52, "learning_rate": 7.250762145683336e-05, "loss": 0.007, "step": 140290 }, { "epoch": 1.52, "learning_rate": 7.249140559123045e-05, "loss": 0.0092, "step": 140300 }, { "epoch": 1.52, "learning_rate": 7.247518972562754e-05, "loss": 0.0075, "step": 140310 }, { "epoch": 1.52, "learning_rate": 7.245897386002464e-05, "loss": 0.0069, "step": 140320 }, { "epoch": 1.52, "learning_rate": 7.244275799442174e-05, "loss": 0.0087, "step": 140330 }, { "epoch": 1.52, "learning_rate": 7.242654212881883e-05, "loss": 0.0092, "step": 140340 }, { "epoch": 1.52, "learning_rate": 7.241032626321593e-05, "loss": 0.0096, "step": 140350 }, { "epoch": 1.52, "learning_rate": 7.239411039761302e-05, "loss": 0.0064, "step": 140360 }, { "epoch": 1.52, "learning_rate": 7.237789453201011e-05, "loss": 0.0086, "step": 140370 }, { "epoch": 1.52, "learning_rate": 7.23616786664072e-05, "loss": 0.0077, "step": 140380 }, { "epoch": 1.52, "learning_rate": 7.23454628008043e-05, "loss": 0.008, "step": 140390 }, { "epoch": 1.52, "learning_rate": 7.232924693520139e-05, "loss": 0.0086, "step": 140400 }, { "epoch": 1.52, "learning_rate": 7.231303106959848e-05, "loss": 0.0117, "step": 140410 }, { "epoch": 1.52, "learning_rate": 7.229681520399558e-05, "loss": 0.0085, "step": 140420 }, { "epoch": 1.52, "learning_rate": 7.228059933839267e-05, "loss": 0.0082, "step": 140430 }, { "epoch": 1.52, "learning_rate": 7.226438347278978e-05, "loss": 0.0074, "step": 140440 }, { "epoch": 1.52, "learning_rate": 7.224816760718687e-05, "loss": 0.0064, "step": 140450 }, { "epoch": 1.52, "learning_rate": 7.223195174158396e-05, "loss": 0.0086, "step": 140460 }, { "epoch": 1.52, "learning_rate": 7.221573587598105e-05, "loss": 0.0081, "step": 140470 }, { "epoch": 1.52, "learning_rate": 7.219952001037815e-05, "loss": 0.0067, "step": 140480 }, { "epoch": 1.52, "learning_rate": 7.218330414477524e-05, "loss": 0.0084, "step": 140490 }, { "epoch": 1.52, "learning_rate": 7.216708827917233e-05, "loss": 0.0094, "step": 140500 }, { "epoch": 1.52, "learning_rate": 7.215087241356942e-05, "loss": 0.0092, "step": 140510 }, { "epoch": 1.52, "learning_rate": 7.213465654796652e-05, "loss": 0.0063, "step": 140520 }, { "epoch": 1.52, "learning_rate": 7.211844068236361e-05, "loss": 0.0069, "step": 140530 }, { "epoch": 1.52, "learning_rate": 7.21022248167607e-05, "loss": 0.0069, "step": 140540 }, { "epoch": 1.52, "learning_rate": 7.208600895115781e-05, "loss": 0.0072, "step": 140550 }, { "epoch": 1.52, "learning_rate": 7.20697930855549e-05, "loss": 0.006, "step": 140560 }, { "epoch": 1.52, "learning_rate": 7.2053577219952e-05, "loss": 0.0069, "step": 140570 }, { "epoch": 1.52, "learning_rate": 7.203736135434909e-05, "loss": 0.0079, "step": 140580 }, { "epoch": 1.52, "learning_rate": 7.202114548874618e-05, "loss": 0.0071, "step": 140590 }, { "epoch": 1.52, "learning_rate": 7.200492962314327e-05, "loss": 0.0069, "step": 140600 }, { "epoch": 1.52, "learning_rate": 7.198871375754037e-05, "loss": 0.0082, "step": 140610 }, { "epoch": 1.52, "learning_rate": 7.197249789193746e-05, "loss": 0.0082, "step": 140620 }, { "epoch": 1.52, "learning_rate": 7.195628202633456e-05, "loss": 0.006, "step": 140630 }, { "epoch": 1.52, "learning_rate": 7.194006616073166e-05, "loss": 0.0092, "step": 140640 }, { "epoch": 1.52, "learning_rate": 7.192385029512875e-05, "loss": 0.0053, "step": 140650 }, { "epoch": 1.52, "learning_rate": 7.190763442952584e-05, "loss": 0.0084, "step": 140660 }, { "epoch": 1.52, "learning_rate": 7.189141856392294e-05, "loss": 0.0084, "step": 140670 }, { "epoch": 1.52, "learning_rate": 7.187520269832003e-05, "loss": 0.0071, "step": 140680 }, { "epoch": 1.52, "learning_rate": 7.185898683271713e-05, "loss": 0.0074, "step": 140690 }, { "epoch": 1.52, "learning_rate": 7.184277096711423e-05, "loss": 0.008, "step": 140700 }, { "epoch": 1.52, "learning_rate": 7.182655510151132e-05, "loss": 0.0065, "step": 140710 }, { "epoch": 1.52, "learning_rate": 7.181033923590841e-05, "loss": 0.0087, "step": 140720 }, { "epoch": 1.52, "learning_rate": 7.17941233703055e-05, "loss": 0.0083, "step": 140730 }, { "epoch": 1.52, "learning_rate": 7.17779075047026e-05, "loss": 0.01, "step": 140740 }, { "epoch": 1.52, "learning_rate": 7.176169163909969e-05, "loss": 0.0073, "step": 140750 }, { "epoch": 1.52, "learning_rate": 7.174547577349678e-05, "loss": 0.007, "step": 140760 }, { "epoch": 1.52, "learning_rate": 7.172925990789388e-05, "loss": 0.0073, "step": 140770 }, { "epoch": 1.52, "learning_rate": 7.171304404229097e-05, "loss": 0.0119, "step": 140780 }, { "epoch": 1.52, "learning_rate": 7.169682817668806e-05, "loss": 0.0071, "step": 140790 }, { "epoch": 1.52, "learning_rate": 7.168061231108517e-05, "loss": 0.0069, "step": 140800 }, { "epoch": 1.52, "learning_rate": 7.166439644548226e-05, "loss": 0.0069, "step": 140810 }, { "epoch": 1.52, "learning_rate": 7.164818057987935e-05, "loss": 0.0089, "step": 140820 }, { "epoch": 1.52, "learning_rate": 7.163196471427645e-05, "loss": 0.0088, "step": 140830 }, { "epoch": 1.52, "learning_rate": 7.161574884867354e-05, "loss": 0.0075, "step": 140840 }, { "epoch": 1.52, "learning_rate": 7.159953298307063e-05, "loss": 0.0082, "step": 140850 }, { "epoch": 1.52, "learning_rate": 7.158331711746772e-05, "loss": 0.0079, "step": 140860 }, { "epoch": 1.52, "learning_rate": 7.156710125186482e-05, "loss": 0.0071, "step": 140870 }, { "epoch": 1.52, "learning_rate": 7.155088538626191e-05, "loss": 0.0103, "step": 140880 }, { "epoch": 1.52, "learning_rate": 7.1534669520659e-05, "loss": 0.0053, "step": 140890 }, { "epoch": 1.52, "learning_rate": 7.15184536550561e-05, "loss": 0.0094, "step": 140900 }, { "epoch": 1.52, "learning_rate": 7.15022377894532e-05, "loss": 0.0086, "step": 140910 }, { "epoch": 1.52, "learning_rate": 7.14860219238503e-05, "loss": 0.0079, "step": 140920 }, { "epoch": 1.52, "learning_rate": 7.146980605824739e-05, "loss": 0.0064, "step": 140930 }, { "epoch": 1.52, "learning_rate": 7.145359019264448e-05, "loss": 0.0088, "step": 140940 }, { "epoch": 1.52, "learning_rate": 7.143737432704157e-05, "loss": 0.0066, "step": 140950 }, { "epoch": 1.52, "learning_rate": 7.142115846143867e-05, "loss": 0.0069, "step": 140960 }, { "epoch": 1.52, "learning_rate": 7.140494259583576e-05, "loss": 0.0088, "step": 140970 }, { "epoch": 1.52, "learning_rate": 7.138872673023285e-05, "loss": 0.0067, "step": 140980 }, { "epoch": 1.52, "learning_rate": 7.137251086462994e-05, "loss": 0.0082, "step": 140990 }, { "epoch": 1.52, "learning_rate": 7.135629499902704e-05, "loss": 0.0062, "step": 141000 }, { "epoch": 1.52, "eval_cer": 0.9215347519356817, "eval_loss": 0.006414701230823994, "eval_runtime": 121.2563, "eval_samples_per_second": 16.494, "eval_steps_per_second": 4.123, "step": 141000 }, { "epoch": 1.52, "learning_rate": 7.134007913342413e-05, "loss": 0.0071, "step": 141010 }, { "epoch": 1.52, "learning_rate": 7.132386326782124e-05, "loss": 0.0075, "step": 141020 }, { "epoch": 1.52, "learning_rate": 7.130764740221833e-05, "loss": 0.0101, "step": 141030 }, { "epoch": 1.52, "learning_rate": 7.129143153661542e-05, "loss": 0.0109, "step": 141040 }, { "epoch": 1.52, "learning_rate": 7.127521567101251e-05, "loss": 0.009, "step": 141050 }, { "epoch": 1.52, "learning_rate": 7.12589998054096e-05, "loss": 0.0088, "step": 141060 }, { "epoch": 1.53, "learning_rate": 7.12427839398067e-05, "loss": 0.0069, "step": 141070 }, { "epoch": 1.53, "learning_rate": 7.122656807420379e-05, "loss": 0.0059, "step": 141080 }, { "epoch": 1.53, "learning_rate": 7.121035220860088e-05, "loss": 0.0065, "step": 141090 }, { "epoch": 1.53, "learning_rate": 7.119413634299798e-05, "loss": 0.0091, "step": 141100 }, { "epoch": 1.53, "learning_rate": 7.117792047739507e-05, "loss": 0.0109, "step": 141110 }, { "epoch": 1.53, "learning_rate": 7.116170461179216e-05, "loss": 0.0082, "step": 141120 }, { "epoch": 1.53, "learning_rate": 7.114548874618927e-05, "loss": 0.0066, "step": 141130 }, { "epoch": 1.53, "learning_rate": 7.112927288058636e-05, "loss": 0.0075, "step": 141140 }, { "epoch": 1.53, "learning_rate": 7.111305701498345e-05, "loss": 0.0088, "step": 141150 }, { "epoch": 1.53, "learning_rate": 7.109684114938055e-05, "loss": 0.008, "step": 141160 }, { "epoch": 1.53, "learning_rate": 7.108062528377764e-05, "loss": 0.0082, "step": 141170 }, { "epoch": 1.53, "learning_rate": 7.106440941817473e-05, "loss": 0.0072, "step": 141180 }, { "epoch": 1.53, "learning_rate": 7.104819355257183e-05, "loss": 0.0079, "step": 141190 }, { "epoch": 1.53, "learning_rate": 7.103197768696892e-05, "loss": 0.0084, "step": 141200 }, { "epoch": 1.53, "learning_rate": 7.101576182136601e-05, "loss": 0.0066, "step": 141210 }, { "epoch": 1.53, "learning_rate": 7.09995459557631e-05, "loss": 0.0072, "step": 141220 }, { "epoch": 1.53, "learning_rate": 7.098333009016021e-05, "loss": 0.0069, "step": 141230 }, { "epoch": 1.53, "learning_rate": 7.09671142245573e-05, "loss": 0.0087, "step": 141240 }, { "epoch": 1.53, "learning_rate": 7.09508983589544e-05, "loss": 0.008, "step": 141250 }, { "epoch": 1.53, "learning_rate": 7.093468249335149e-05, "loss": 0.0055, "step": 141260 }, { "epoch": 1.53, "learning_rate": 7.091846662774858e-05, "loss": 0.0062, "step": 141270 }, { "epoch": 1.53, "learning_rate": 7.090225076214567e-05, "loss": 0.0066, "step": 141280 }, { "epoch": 1.53, "learning_rate": 7.088603489654277e-05, "loss": 0.0068, "step": 141290 }, { "epoch": 1.53, "learning_rate": 7.086981903093986e-05, "loss": 0.0078, "step": 141300 }, { "epoch": 1.53, "learning_rate": 7.085360316533695e-05, "loss": 0.0054, "step": 141310 }, { "epoch": 1.53, "learning_rate": 7.083738729973404e-05, "loss": 0.007, "step": 141320 }, { "epoch": 1.53, "learning_rate": 7.082117143413114e-05, "loss": 0.0078, "step": 141330 }, { "epoch": 1.53, "learning_rate": 7.080495556852824e-05, "loss": 0.0085, "step": 141340 }, { "epoch": 1.53, "learning_rate": 7.078873970292534e-05, "loss": 0.0065, "step": 141350 }, { "epoch": 1.53, "learning_rate": 7.077252383732243e-05, "loss": 0.0071, "step": 141360 }, { "epoch": 1.53, "learning_rate": 7.075630797171952e-05, "loss": 0.0068, "step": 141370 }, { "epoch": 1.53, "learning_rate": 7.074009210611663e-05, "loss": 0.007, "step": 141380 }, { "epoch": 1.53, "learning_rate": 7.072387624051372e-05, "loss": 0.0075, "step": 141390 }, { "epoch": 1.53, "learning_rate": 7.070766037491081e-05, "loss": 0.0059, "step": 141400 }, { "epoch": 1.53, "learning_rate": 7.06914445093079e-05, "loss": 0.0063, "step": 141410 }, { "epoch": 1.53, "learning_rate": 7.0675228643705e-05, "loss": 0.0093, "step": 141420 }, { "epoch": 1.53, "learning_rate": 7.065901277810209e-05, "loss": 0.007, "step": 141430 }, { "epoch": 1.53, "learning_rate": 7.064279691249918e-05, "loss": 0.0084, "step": 141440 }, { "epoch": 1.53, "learning_rate": 7.062658104689628e-05, "loss": 0.0088, "step": 141450 }, { "epoch": 1.53, "learning_rate": 7.061036518129337e-05, "loss": 0.0067, "step": 141460 }, { "epoch": 1.53, "learning_rate": 7.059414931569046e-05, "loss": 0.0084, "step": 141470 }, { "epoch": 1.53, "learning_rate": 7.057793345008756e-05, "loss": 0.0087, "step": 141480 }, { "epoch": 1.53, "learning_rate": 7.056171758448466e-05, "loss": 0.0072, "step": 141490 }, { "epoch": 1.53, "learning_rate": 7.054550171888175e-05, "loss": 0.008, "step": 141500 }, { "epoch": 1.53, "learning_rate": 7.052928585327885e-05, "loss": 0.0076, "step": 141510 }, { "epoch": 1.53, "learning_rate": 7.051306998767594e-05, "loss": 0.0101, "step": 141520 }, { "epoch": 1.53, "learning_rate": 7.049685412207303e-05, "loss": 0.0061, "step": 141530 }, { "epoch": 1.53, "learning_rate": 7.048063825647013e-05, "loss": 0.0066, "step": 141540 }, { "epoch": 1.53, "learning_rate": 7.046442239086722e-05, "loss": 0.0071, "step": 141550 }, { "epoch": 1.53, "learning_rate": 7.044820652526431e-05, "loss": 0.0089, "step": 141560 }, { "epoch": 1.53, "learning_rate": 7.04319906596614e-05, "loss": 0.0078, "step": 141570 }, { "epoch": 1.53, "learning_rate": 7.04157747940585e-05, "loss": 0.0087, "step": 141580 }, { "epoch": 1.53, "learning_rate": 7.039955892845559e-05, "loss": 0.0057, "step": 141590 }, { "epoch": 1.53, "learning_rate": 7.03833430628527e-05, "loss": 0.0082, "step": 141600 }, { "epoch": 1.53, "learning_rate": 7.036712719724979e-05, "loss": 0.008, "step": 141610 }, { "epoch": 1.53, "learning_rate": 7.035091133164688e-05, "loss": 0.0063, "step": 141620 }, { "epoch": 1.53, "learning_rate": 7.033469546604397e-05, "loss": 0.0066, "step": 141630 }, { "epoch": 1.53, "learning_rate": 7.031847960044107e-05, "loss": 0.0068, "step": 141640 }, { "epoch": 1.53, "learning_rate": 7.030226373483816e-05, "loss": 0.0123, "step": 141650 }, { "epoch": 1.53, "learning_rate": 7.028604786923525e-05, "loss": 0.0061, "step": 141660 }, { "epoch": 1.53, "learning_rate": 7.026983200363235e-05, "loss": 0.0059, "step": 141670 }, { "epoch": 1.53, "learning_rate": 7.025361613802944e-05, "loss": 0.0074, "step": 141680 }, { "epoch": 1.53, "learning_rate": 7.023740027242653e-05, "loss": 0.0074, "step": 141690 }, { "epoch": 1.53, "learning_rate": 7.022118440682362e-05, "loss": 0.0067, "step": 141700 }, { "epoch": 1.53, "learning_rate": 7.020496854122073e-05, "loss": 0.0086, "step": 141710 }, { "epoch": 1.53, "learning_rate": 7.018875267561782e-05, "loss": 0.0076, "step": 141720 }, { "epoch": 1.53, "learning_rate": 7.017253681001492e-05, "loss": 0.0087, "step": 141730 }, { "epoch": 1.53, "learning_rate": 7.015632094441201e-05, "loss": 0.0078, "step": 141740 }, { "epoch": 1.53, "learning_rate": 7.01401050788091e-05, "loss": 0.0094, "step": 141750 }, { "epoch": 1.53, "learning_rate": 7.01238892132062e-05, "loss": 0.0074, "step": 141760 }, { "epoch": 1.53, "learning_rate": 7.010767334760329e-05, "loss": 0.0064, "step": 141770 }, { "epoch": 1.53, "learning_rate": 7.009145748200038e-05, "loss": 0.0089, "step": 141780 }, { "epoch": 1.53, "learning_rate": 7.007524161639747e-05, "loss": 0.0073, "step": 141790 }, { "epoch": 1.53, "learning_rate": 7.005902575079456e-05, "loss": 0.0067, "step": 141800 }, { "epoch": 1.53, "learning_rate": 7.004280988519167e-05, "loss": 0.0084, "step": 141810 }, { "epoch": 1.53, "learning_rate": 7.002659401958876e-05, "loss": 0.0099, "step": 141820 }, { "epoch": 1.53, "learning_rate": 7.001037815398586e-05, "loss": 0.0088, "step": 141830 }, { "epoch": 1.53, "learning_rate": 6.999416228838295e-05, "loss": 0.0067, "step": 141840 }, { "epoch": 1.53, "learning_rate": 6.997794642278004e-05, "loss": 0.0071, "step": 141850 }, { "epoch": 1.53, "learning_rate": 6.996173055717713e-05, "loss": 0.0113, "step": 141860 }, { "epoch": 1.53, "learning_rate": 6.994551469157423e-05, "loss": 0.0069, "step": 141870 }, { "epoch": 1.53, "learning_rate": 6.992929882597132e-05, "loss": 0.009, "step": 141880 }, { "epoch": 1.53, "learning_rate": 6.991308296036841e-05, "loss": 0.0077, "step": 141890 }, { "epoch": 1.53, "learning_rate": 6.98968670947655e-05, "loss": 0.007, "step": 141900 }, { "epoch": 1.53, "learning_rate": 6.98806512291626e-05, "loss": 0.007, "step": 141910 }, { "epoch": 1.53, "learning_rate": 6.98644353635597e-05, "loss": 0.0065, "step": 141920 }, { "epoch": 1.53, "learning_rate": 6.98482194979568e-05, "loss": 0.0066, "step": 141930 }, { "epoch": 1.53, "learning_rate": 6.983200363235389e-05, "loss": 0.0079, "step": 141940 }, { "epoch": 1.53, "learning_rate": 6.981578776675098e-05, "loss": 0.0062, "step": 141950 }, { "epoch": 1.53, "learning_rate": 6.979957190114808e-05, "loss": 0.0104, "step": 141960 }, { "epoch": 1.53, "learning_rate": 6.978335603554517e-05, "loss": 0.0097, "step": 141970 }, { "epoch": 1.53, "learning_rate": 6.976714016994226e-05, "loss": 0.0064, "step": 141980 }, { "epoch": 1.53, "learning_rate": 6.975092430433935e-05, "loss": 0.0088, "step": 141990 }, { "epoch": 1.54, "learning_rate": 6.973470843873645e-05, "loss": 0.007, "step": 142000 }, { "epoch": 1.54, "eval_cer": 0.9215330147297689, "eval_loss": 0.0063419705256819725, "eval_runtime": 121.1571, "eval_samples_per_second": 16.507, "eval_steps_per_second": 4.127, "step": 142000 }, { "epoch": 1.54, "learning_rate": 6.971849257313354e-05, "loss": 0.0088, "step": 142010 }, { "epoch": 1.54, "learning_rate": 6.970227670753063e-05, "loss": 0.0063, "step": 142020 }, { "epoch": 1.54, "learning_rate": 6.968606084192774e-05, "loss": 0.0055, "step": 142030 }, { "epoch": 1.54, "learning_rate": 6.966984497632483e-05, "loss": 0.0067, "step": 142040 }, { "epoch": 1.54, "learning_rate": 6.965362911072192e-05, "loss": 0.0067, "step": 142050 }, { "epoch": 1.54, "learning_rate": 6.963741324511902e-05, "loss": 0.0087, "step": 142060 }, { "epoch": 1.54, "learning_rate": 6.962119737951612e-05, "loss": 0.0097, "step": 142070 }, { "epoch": 1.54, "learning_rate": 6.960498151391322e-05, "loss": 0.0084, "step": 142080 }, { "epoch": 1.54, "learning_rate": 6.958876564831031e-05, "loss": 0.0089, "step": 142090 }, { "epoch": 1.54, "learning_rate": 6.95725497827074e-05, "loss": 0.0064, "step": 142100 }, { "epoch": 1.54, "learning_rate": 6.95563339171045e-05, "loss": 0.0076, "step": 142110 }, { "epoch": 1.54, "learning_rate": 6.954011805150159e-05, "loss": 0.007, "step": 142120 }, { "epoch": 1.54, "learning_rate": 6.952390218589868e-05, "loss": 0.0079, "step": 142130 }, { "epoch": 1.54, "learning_rate": 6.950768632029577e-05, "loss": 0.0077, "step": 142140 }, { "epoch": 1.54, "learning_rate": 6.949147045469286e-05, "loss": 0.008, "step": 142150 }, { "epoch": 1.54, "learning_rate": 6.947525458908996e-05, "loss": 0.0083, "step": 142160 }, { "epoch": 1.54, "learning_rate": 6.945903872348705e-05, "loss": 0.0085, "step": 142170 }, { "epoch": 1.54, "learning_rate": 6.944282285788416e-05, "loss": 0.0078, "step": 142180 }, { "epoch": 1.54, "learning_rate": 6.942660699228125e-05, "loss": 0.0069, "step": 142190 }, { "epoch": 1.54, "learning_rate": 6.941039112667834e-05, "loss": 0.008, "step": 142200 }, { "epoch": 1.54, "learning_rate": 6.939417526107543e-05, "loss": 0.007, "step": 142210 }, { "epoch": 1.54, "learning_rate": 6.937795939547253e-05, "loss": 0.0067, "step": 142220 }, { "epoch": 1.54, "learning_rate": 6.936174352986962e-05, "loss": 0.0087, "step": 142230 }, { "epoch": 1.54, "learning_rate": 6.934552766426671e-05, "loss": 0.008, "step": 142240 }, { "epoch": 1.54, "learning_rate": 6.93293117986638e-05, "loss": 0.0102, "step": 142250 }, { "epoch": 1.54, "learning_rate": 6.93130959330609e-05, "loss": 0.009, "step": 142260 }, { "epoch": 1.54, "learning_rate": 6.929688006745799e-05, "loss": 0.0075, "step": 142270 }, { "epoch": 1.54, "learning_rate": 6.92806642018551e-05, "loss": 0.0081, "step": 142280 }, { "epoch": 1.54, "learning_rate": 6.926444833625219e-05, "loss": 0.0095, "step": 142290 }, { "epoch": 1.54, "learning_rate": 6.924823247064928e-05, "loss": 0.0101, "step": 142300 }, { "epoch": 1.54, "learning_rate": 6.923201660504638e-05, "loss": 0.008, "step": 142310 }, { "epoch": 1.54, "learning_rate": 6.921580073944347e-05, "loss": 0.0085, "step": 142320 }, { "epoch": 1.54, "learning_rate": 6.919958487384056e-05, "loss": 0.0096, "step": 142330 }, { "epoch": 1.54, "learning_rate": 6.918336900823765e-05, "loss": 0.0058, "step": 142340 }, { "epoch": 1.54, "learning_rate": 6.916715314263475e-05, "loss": 0.0078, "step": 142350 }, { "epoch": 1.54, "learning_rate": 6.915093727703184e-05, "loss": 0.0071, "step": 142360 }, { "epoch": 1.54, "learning_rate": 6.913472141142893e-05, "loss": 0.0082, "step": 142370 }, { "epoch": 1.54, "learning_rate": 6.911850554582602e-05, "loss": 0.0088, "step": 142380 }, { "epoch": 1.54, "learning_rate": 6.910228968022313e-05, "loss": 0.0066, "step": 142390 }, { "epoch": 1.54, "learning_rate": 6.908607381462022e-05, "loss": 0.0109, "step": 142400 }, { "epoch": 1.54, "learning_rate": 6.906985794901732e-05, "loss": 0.0083, "step": 142410 }, { "epoch": 1.54, "learning_rate": 6.905364208341441e-05, "loss": 0.006, "step": 142420 }, { "epoch": 1.54, "learning_rate": 6.90374262178115e-05, "loss": 0.0072, "step": 142430 }, { "epoch": 1.54, "learning_rate": 6.90212103522086e-05, "loss": 0.0084, "step": 142440 }, { "epoch": 1.54, "learning_rate": 6.900499448660569e-05, "loss": 0.0086, "step": 142450 }, { "epoch": 1.54, "learning_rate": 6.898877862100278e-05, "loss": 0.0056, "step": 142460 }, { "epoch": 1.54, "learning_rate": 6.897256275539987e-05, "loss": 0.0069, "step": 142470 }, { "epoch": 1.54, "learning_rate": 6.895634688979697e-05, "loss": 0.0075, "step": 142480 }, { "epoch": 1.54, "learning_rate": 6.894013102419406e-05, "loss": 0.0103, "step": 142490 }, { "epoch": 1.54, "learning_rate": 6.892391515859116e-05, "loss": 0.0106, "step": 142500 }, { "epoch": 1.54, "learning_rate": 6.890769929298826e-05, "loss": 0.0073, "step": 142510 }, { "epoch": 1.54, "learning_rate": 6.889148342738535e-05, "loss": 0.0066, "step": 142520 }, { "epoch": 1.54, "learning_rate": 6.887526756178244e-05, "loss": 0.0078, "step": 142530 }, { "epoch": 1.54, "learning_rate": 6.885905169617954e-05, "loss": 0.0071, "step": 142540 }, { "epoch": 1.54, "learning_rate": 6.884283583057663e-05, "loss": 0.007, "step": 142550 }, { "epoch": 1.54, "learning_rate": 6.882661996497372e-05, "loss": 0.0104, "step": 142560 }, { "epoch": 1.54, "learning_rate": 6.881040409937081e-05, "loss": 0.0084, "step": 142570 }, { "epoch": 1.54, "learning_rate": 6.87941882337679e-05, "loss": 0.0101, "step": 142580 }, { "epoch": 1.54, "learning_rate": 6.8777972368165e-05, "loss": 0.008, "step": 142590 }, { "epoch": 1.54, "learning_rate": 6.876175650256209e-05, "loss": 0.0072, "step": 142600 }, { "epoch": 1.54, "learning_rate": 6.87455406369592e-05, "loss": 0.0062, "step": 142610 }, { "epoch": 1.54, "learning_rate": 6.872932477135629e-05, "loss": 0.0071, "step": 142620 }, { "epoch": 1.54, "learning_rate": 6.871310890575338e-05, "loss": 0.0083, "step": 142630 }, { "epoch": 1.54, "learning_rate": 6.869689304015048e-05, "loss": 0.0074, "step": 142640 }, { "epoch": 1.54, "learning_rate": 6.868067717454757e-05, "loss": 0.0083, "step": 142650 }, { "epoch": 1.54, "learning_rate": 6.866446130894466e-05, "loss": 0.0093, "step": 142660 }, { "epoch": 1.54, "learning_rate": 6.864824544334176e-05, "loss": 0.0077, "step": 142670 }, { "epoch": 1.54, "learning_rate": 6.863202957773885e-05, "loss": 0.0088, "step": 142680 }, { "epoch": 1.54, "learning_rate": 6.861581371213594e-05, "loss": 0.0082, "step": 142690 }, { "epoch": 1.54, "learning_rate": 6.859959784653303e-05, "loss": 0.0116, "step": 142700 }, { "epoch": 1.54, "learning_rate": 6.858338198093013e-05, "loss": 0.0078, "step": 142710 }, { "epoch": 1.54, "learning_rate": 6.856716611532723e-05, "loss": 0.0074, "step": 142720 }, { "epoch": 1.54, "learning_rate": 6.855095024972433e-05, "loss": 0.0075, "step": 142730 }, { "epoch": 1.54, "learning_rate": 6.853473438412142e-05, "loss": 0.0069, "step": 142740 }, { "epoch": 1.54, "learning_rate": 6.851851851851851e-05, "loss": 0.0084, "step": 142750 }, { "epoch": 1.54, "learning_rate": 6.85023026529156e-05, "loss": 0.0073, "step": 142760 }, { "epoch": 1.54, "learning_rate": 6.84860867873127e-05, "loss": 0.0091, "step": 142770 }, { "epoch": 1.54, "learning_rate": 6.846987092170979e-05, "loss": 0.0067, "step": 142780 }, { "epoch": 1.54, "learning_rate": 6.84536550561069e-05, "loss": 0.0067, "step": 142790 }, { "epoch": 1.54, "learning_rate": 6.843743919050399e-05, "loss": 0.0083, "step": 142800 }, { "epoch": 1.54, "learning_rate": 6.842122332490108e-05, "loss": 0.0063, "step": 142810 }, { "epoch": 1.54, "learning_rate": 6.840500745929817e-05, "loss": 0.0073, "step": 142820 }, { "epoch": 1.54, "learning_rate": 6.838879159369527e-05, "loss": 0.0067, "step": 142830 }, { "epoch": 1.54, "learning_rate": 6.837257572809236e-05, "loss": 0.0075, "step": 142840 }, { "epoch": 1.54, "learning_rate": 6.835635986248945e-05, "loss": 0.0083, "step": 142850 }, { "epoch": 1.54, "learning_rate": 6.834014399688656e-05, "loss": 0.0071, "step": 142860 }, { "epoch": 1.54, "learning_rate": 6.832392813128365e-05, "loss": 0.0091, "step": 142870 }, { "epoch": 1.54, "learning_rate": 6.830771226568074e-05, "loss": 0.0071, "step": 142880 }, { "epoch": 1.54, "learning_rate": 6.829149640007784e-05, "loss": 0.0117, "step": 142890 }, { "epoch": 1.54, "learning_rate": 6.827528053447493e-05, "loss": 0.009, "step": 142900 }, { "epoch": 1.54, "learning_rate": 6.825906466887202e-05, "loss": 0.0066, "step": 142910 }, { "epoch": 1.55, "learning_rate": 6.824284880326911e-05, "loss": 0.007, "step": 142920 }, { "epoch": 1.55, "learning_rate": 6.822663293766621e-05, "loss": 0.0082, "step": 142930 }, { "epoch": 1.55, "learning_rate": 6.82104170720633e-05, "loss": 0.011, "step": 142940 }, { "epoch": 1.55, "learning_rate": 6.819420120646039e-05, "loss": 0.0071, "step": 142950 }, { "epoch": 1.55, "learning_rate": 6.817798534085749e-05, "loss": 0.006, "step": 142960 }, { "epoch": 1.55, "learning_rate": 6.816176947525459e-05, "loss": 0.0084, "step": 142970 }, { "epoch": 1.55, "learning_rate": 6.814555360965168e-05, "loss": 0.0073, "step": 142980 }, { "epoch": 1.55, "learning_rate": 6.812933774404878e-05, "loss": 0.0079, "step": 142990 }, { "epoch": 1.55, "learning_rate": 6.811312187844587e-05, "loss": 0.0082, "step": 143000 }, { "epoch": 1.55, "eval_cer": 0.9215269345090743, "eval_loss": 0.00622851075604558, "eval_runtime": 121.148, "eval_samples_per_second": 16.509, "eval_steps_per_second": 4.127, "step": 143000 }, { "epoch": 1.55, "learning_rate": 6.809690601284296e-05, "loss": 0.0068, "step": 143010 }, { "epoch": 1.55, "learning_rate": 6.808069014724006e-05, "loss": 0.0087, "step": 143020 }, { "epoch": 1.55, "learning_rate": 6.806447428163715e-05, "loss": 0.0067, "step": 143030 }, { "epoch": 1.55, "learning_rate": 6.804825841603424e-05, "loss": 0.0078, "step": 143040 }, { "epoch": 1.55, "learning_rate": 6.803204255043133e-05, "loss": 0.0053, "step": 143050 }, { "epoch": 1.55, "learning_rate": 6.801582668482843e-05, "loss": 0.0064, "step": 143060 }, { "epoch": 1.55, "learning_rate": 6.799961081922552e-05, "loss": 0.0106, "step": 143070 }, { "epoch": 1.55, "learning_rate": 6.798339495362263e-05, "loss": 0.0078, "step": 143080 }, { "epoch": 1.55, "learning_rate": 6.796717908801972e-05, "loss": 0.0076, "step": 143090 }, { "epoch": 1.55, "learning_rate": 6.795096322241681e-05, "loss": 0.0075, "step": 143100 }, { "epoch": 1.55, "learning_rate": 6.79347473568139e-05, "loss": 0.0072, "step": 143110 }, { "epoch": 1.55, "learning_rate": 6.7918531491211e-05, "loss": 0.0075, "step": 143120 }, { "epoch": 1.55, "learning_rate": 6.790231562560809e-05, "loss": 0.0077, "step": 143130 }, { "epoch": 1.55, "learning_rate": 6.788609976000518e-05, "loss": 0.0079, "step": 143140 }, { "epoch": 1.55, "learning_rate": 6.786988389440227e-05, "loss": 0.0079, "step": 143150 }, { "epoch": 1.55, "learning_rate": 6.785366802879937e-05, "loss": 0.0089, "step": 143160 }, { "epoch": 1.55, "learning_rate": 6.783745216319646e-05, "loss": 0.0087, "step": 143170 }, { "epoch": 1.55, "learning_rate": 6.782123629759355e-05, "loss": 0.0096, "step": 143180 }, { "epoch": 1.55, "learning_rate": 6.780502043199066e-05, "loss": 0.0071, "step": 143190 }, { "epoch": 1.55, "learning_rate": 6.778880456638775e-05, "loss": 0.0078, "step": 143200 }, { "epoch": 1.55, "learning_rate": 6.777258870078484e-05, "loss": 0.0099, "step": 143210 }, { "epoch": 1.55, "learning_rate": 6.775637283518194e-05, "loss": 0.0077, "step": 143220 }, { "epoch": 1.55, "learning_rate": 6.774015696957903e-05, "loss": 0.007, "step": 143230 }, { "epoch": 1.55, "learning_rate": 6.772394110397612e-05, "loss": 0.0083, "step": 143240 }, { "epoch": 1.55, "learning_rate": 6.770772523837322e-05, "loss": 0.0065, "step": 143250 }, { "epoch": 1.55, "learning_rate": 6.769150937277031e-05, "loss": 0.0073, "step": 143260 }, { "epoch": 1.55, "learning_rate": 6.76752935071674e-05, "loss": 0.0086, "step": 143270 }, { "epoch": 1.55, "learning_rate": 6.76590776415645e-05, "loss": 0.0092, "step": 143280 }, { "epoch": 1.55, "learning_rate": 6.764286177596159e-05, "loss": 0.0082, "step": 143290 }, { "epoch": 1.55, "learning_rate": 6.762664591035869e-05, "loss": 0.0092, "step": 143300 }, { "epoch": 1.55, "learning_rate": 6.761043004475579e-05, "loss": 0.0072, "step": 143310 }, { "epoch": 1.55, "learning_rate": 6.759421417915288e-05, "loss": 0.0088, "step": 143320 }, { "epoch": 1.55, "learning_rate": 6.757799831354997e-05, "loss": 0.0087, "step": 143330 }, { "epoch": 1.55, "learning_rate": 6.756178244794706e-05, "loss": 0.0088, "step": 143340 }, { "epoch": 1.55, "learning_rate": 6.754556658234416e-05, "loss": 0.007, "step": 143350 }, { "epoch": 1.55, "learning_rate": 6.752935071674125e-05, "loss": 0.0085, "step": 143360 }, { "epoch": 1.55, "learning_rate": 6.751313485113834e-05, "loss": 0.0076, "step": 143370 }, { "epoch": 1.55, "learning_rate": 6.749691898553543e-05, "loss": 0.0065, "step": 143380 }, { "epoch": 1.55, "learning_rate": 6.748070311993253e-05, "loss": 0.0085, "step": 143390 }, { "epoch": 1.55, "learning_rate": 6.746448725432963e-05, "loss": 0.0079, "step": 143400 }, { "epoch": 1.55, "learning_rate": 6.744827138872673e-05, "loss": 0.0071, "step": 143410 }, { "epoch": 1.55, "learning_rate": 6.743205552312382e-05, "loss": 0.0094, "step": 143420 }, { "epoch": 1.55, "learning_rate": 6.741583965752091e-05, "loss": 0.0084, "step": 143430 }, { "epoch": 1.55, "learning_rate": 6.7399623791918e-05, "loss": 0.0074, "step": 143440 }, { "epoch": 1.55, "learning_rate": 6.73834079263151e-05, "loss": 0.0084, "step": 143450 }, { "epoch": 1.55, "learning_rate": 6.736719206071219e-05, "loss": 0.0069, "step": 143460 }, { "epoch": 1.55, "learning_rate": 6.735097619510928e-05, "loss": 0.0081, "step": 143470 }, { "epoch": 1.55, "learning_rate": 6.733476032950638e-05, "loss": 0.0076, "step": 143480 }, { "epoch": 1.55, "learning_rate": 6.731854446390347e-05, "loss": 0.0078, "step": 143490 }, { "epoch": 1.55, "learning_rate": 6.730232859830056e-05, "loss": 0.0066, "step": 143500 }, { "epoch": 1.55, "learning_rate": 6.728611273269767e-05, "loss": 0.0081, "step": 143510 }, { "epoch": 1.55, "learning_rate": 6.726989686709476e-05, "loss": 0.0072, "step": 143520 }, { "epoch": 1.55, "learning_rate": 6.725368100149185e-05, "loss": 0.0075, "step": 143530 }, { "epoch": 1.55, "learning_rate": 6.723746513588895e-05, "loss": 0.0055, "step": 143540 }, { "epoch": 1.55, "learning_rate": 6.722124927028605e-05, "loss": 0.0069, "step": 143550 }, { "epoch": 1.55, "learning_rate": 6.720503340468314e-05, "loss": 0.0068, "step": 143560 }, { "epoch": 1.55, "learning_rate": 6.718881753908024e-05, "loss": 0.0069, "step": 143570 }, { "epoch": 1.55, "learning_rate": 6.717260167347733e-05, "loss": 0.0082, "step": 143580 }, { "epoch": 1.55, "learning_rate": 6.715638580787442e-05, "loss": 0.009, "step": 143590 }, { "epoch": 1.55, "learning_rate": 6.714016994227152e-05, "loss": 0.0076, "step": 143600 }, { "epoch": 1.55, "learning_rate": 6.712395407666861e-05, "loss": 0.0081, "step": 143610 }, { "epoch": 1.55, "learning_rate": 6.71077382110657e-05, "loss": 0.0064, "step": 143620 }, { "epoch": 1.55, "learning_rate": 6.70915223454628e-05, "loss": 0.0084, "step": 143630 }, { "epoch": 1.55, "learning_rate": 6.707530647985989e-05, "loss": 0.0067, "step": 143640 }, { "epoch": 1.55, "learning_rate": 6.705909061425698e-05, "loss": 0.0142, "step": 143650 }, { "epoch": 1.55, "learning_rate": 6.704287474865409e-05, "loss": 0.0072, "step": 143660 }, { "epoch": 1.55, "learning_rate": 6.702665888305118e-05, "loss": 0.0069, "step": 143670 }, { "epoch": 1.55, "learning_rate": 6.701044301744827e-05, "loss": 0.0079, "step": 143680 }, { "epoch": 1.55, "learning_rate": 6.699422715184536e-05, "loss": 0.0087, "step": 143690 }, { "epoch": 1.55, "learning_rate": 6.697801128624246e-05, "loss": 0.0072, "step": 143700 }, { "epoch": 1.55, "learning_rate": 6.696179542063955e-05, "loss": 0.0081, "step": 143710 }, { "epoch": 1.55, "learning_rate": 6.694557955503664e-05, "loss": 0.0064, "step": 143720 }, { "epoch": 1.55, "learning_rate": 6.692936368943373e-05, "loss": 0.0072, "step": 143730 }, { "epoch": 1.55, "learning_rate": 6.691314782383083e-05, "loss": 0.0086, "step": 143740 }, { "epoch": 1.55, "learning_rate": 6.689693195822792e-05, "loss": 0.0081, "step": 143750 }, { "epoch": 1.55, "learning_rate": 6.688071609262501e-05, "loss": 0.0084, "step": 143760 }, { "epoch": 1.55, "learning_rate": 6.686450022702212e-05, "loss": 0.007, "step": 143770 }, { "epoch": 1.55, "learning_rate": 6.684828436141921e-05, "loss": 0.0081, "step": 143780 }, { "epoch": 1.55, "learning_rate": 6.68320684958163e-05, "loss": 0.0081, "step": 143790 }, { "epoch": 1.55, "learning_rate": 6.68158526302134e-05, "loss": 0.0089, "step": 143800 }, { "epoch": 1.55, "learning_rate": 6.679963676461049e-05, "loss": 0.0081, "step": 143810 }, { "epoch": 1.55, "learning_rate": 6.678342089900758e-05, "loss": 0.0103, "step": 143820 }, { "epoch": 1.55, "learning_rate": 6.676720503340468e-05, "loss": 0.0075, "step": 143830 }, { "epoch": 1.55, "learning_rate": 6.675098916780177e-05, "loss": 0.0064, "step": 143840 }, { "epoch": 1.56, "learning_rate": 6.673477330219886e-05, "loss": 0.0077, "step": 143850 }, { "epoch": 1.56, "learning_rate": 6.671855743659595e-05, "loss": 0.0097, "step": 143860 }, { "epoch": 1.56, "learning_rate": 6.670234157099306e-05, "loss": 0.0065, "step": 143870 }, { "epoch": 1.56, "learning_rate": 6.668612570539015e-05, "loss": 0.0078, "step": 143880 }, { "epoch": 1.56, "learning_rate": 6.666990983978725e-05, "loss": 0.0071, "step": 143890 }, { "epoch": 1.56, "learning_rate": 6.665369397418434e-05, "loss": 0.0101, "step": 143900 }, { "epoch": 1.56, "learning_rate": 6.663747810858143e-05, "loss": 0.0069, "step": 143910 }, { "epoch": 1.56, "learning_rate": 6.662126224297852e-05, "loss": 0.0067, "step": 143920 }, { "epoch": 1.56, "learning_rate": 6.660504637737562e-05, "loss": 0.0082, "step": 143930 }, { "epoch": 1.56, "learning_rate": 6.658883051177271e-05, "loss": 0.0095, "step": 143940 }, { "epoch": 1.56, "learning_rate": 6.65726146461698e-05, "loss": 0.0062, "step": 143950 }, { "epoch": 1.56, "learning_rate": 6.65563987805669e-05, "loss": 0.0058, "step": 143960 }, { "epoch": 1.56, "learning_rate": 6.654018291496399e-05, "loss": 0.0078, "step": 143970 }, { "epoch": 1.56, "learning_rate": 6.65239670493611e-05, "loss": 0.0081, "step": 143980 }, { "epoch": 1.56, "learning_rate": 6.650775118375819e-05, "loss": 0.0103, "step": 143990 }, { "epoch": 1.56, "learning_rate": 6.649153531815528e-05, "loss": 0.0077, "step": 144000 }, { "epoch": 1.56, "eval_cer": 0.9214974020085575, "eval_loss": 0.006375683005899191, "eval_runtime": 121.1626, "eval_samples_per_second": 16.507, "eval_steps_per_second": 4.127, "step": 144000 }, { "epoch": 1.56, "learning_rate": 6.647531945255237e-05, "loss": 0.0062, "step": 144010 }, { "epoch": 1.56, "learning_rate": 6.645910358694947e-05, "loss": 0.0073, "step": 144020 }, { "epoch": 1.56, "learning_rate": 6.644288772134656e-05, "loss": 0.0083, "step": 144030 }, { "epoch": 1.56, "learning_rate": 6.642667185574365e-05, "loss": 0.0079, "step": 144040 }, { "epoch": 1.56, "learning_rate": 6.641045599014074e-05, "loss": 0.0087, "step": 144050 }, { "epoch": 1.56, "learning_rate": 6.639424012453784e-05, "loss": 0.0067, "step": 144060 }, { "epoch": 1.56, "learning_rate": 6.637802425893493e-05, "loss": 0.0089, "step": 144070 }, { "epoch": 1.56, "learning_rate": 6.636180839333202e-05, "loss": 0.0065, "step": 144080 }, { "epoch": 1.56, "learning_rate": 6.634559252772913e-05, "loss": 0.0072, "step": 144090 }, { "epoch": 1.56, "learning_rate": 6.632937666212622e-05, "loss": 0.0078, "step": 144100 }, { "epoch": 1.56, "learning_rate": 6.631316079652331e-05, "loss": 0.0078, "step": 144110 }, { "epoch": 1.56, "learning_rate": 6.62969449309204e-05, "loss": 0.0111, "step": 144120 }, { "epoch": 1.56, "learning_rate": 6.62807290653175e-05, "loss": 0.0083, "step": 144130 }, { "epoch": 1.56, "learning_rate": 6.626451319971459e-05, "loss": 0.0115, "step": 144140 }, { "epoch": 1.56, "learning_rate": 6.624829733411168e-05, "loss": 0.005, "step": 144150 }, { "epoch": 1.56, "learning_rate": 6.623208146850878e-05, "loss": 0.0087, "step": 144160 }, { "epoch": 1.56, "learning_rate": 6.621586560290587e-05, "loss": 0.0097, "step": 144170 }, { "epoch": 1.56, "learning_rate": 6.619964973730296e-05, "loss": 0.007, "step": 144180 }, { "epoch": 1.56, "learning_rate": 6.618343387170006e-05, "loss": 0.0063, "step": 144190 }, { "epoch": 1.56, "learning_rate": 6.616721800609716e-05, "loss": 0.0078, "step": 144200 }, { "epoch": 1.56, "learning_rate": 6.615100214049425e-05, "loss": 0.0079, "step": 144210 }, { "epoch": 1.56, "learning_rate": 6.613478627489135e-05, "loss": 0.0077, "step": 144220 }, { "epoch": 1.56, "learning_rate": 6.611857040928844e-05, "loss": 0.0074, "step": 144230 }, { "epoch": 1.56, "learning_rate": 6.610235454368555e-05, "loss": 0.0083, "step": 144240 }, { "epoch": 1.56, "learning_rate": 6.608613867808264e-05, "loss": 0.0062, "step": 144250 }, { "epoch": 1.56, "learning_rate": 6.606992281247973e-05, "loss": 0.0077, "step": 144260 }, { "epoch": 1.56, "learning_rate": 6.605370694687682e-05, "loss": 0.0073, "step": 144270 }, { "epoch": 1.56, "learning_rate": 6.603749108127392e-05, "loss": 0.0089, "step": 144280 }, { "epoch": 1.56, "learning_rate": 6.602127521567101e-05, "loss": 0.0075, "step": 144290 }, { "epoch": 1.56, "learning_rate": 6.60050593500681e-05, "loss": 0.0087, "step": 144300 }, { "epoch": 1.56, "learning_rate": 6.59888434844652e-05, "loss": 0.0057, "step": 144310 }, { "epoch": 1.56, "learning_rate": 6.597262761886229e-05, "loss": 0.0071, "step": 144320 }, { "epoch": 1.56, "learning_rate": 6.595641175325938e-05, "loss": 0.0087, "step": 144330 }, { "epoch": 1.56, "learning_rate": 6.594019588765647e-05, "loss": 0.0084, "step": 144340 }, { "epoch": 1.56, "learning_rate": 6.592398002205358e-05, "loss": 0.0061, "step": 144350 }, { "epoch": 1.56, "learning_rate": 6.590776415645067e-05, "loss": 0.0064, "step": 144360 }, { "epoch": 1.56, "learning_rate": 6.589154829084777e-05, "loss": 0.0079, "step": 144370 }, { "epoch": 1.56, "learning_rate": 6.587533242524486e-05, "loss": 0.0073, "step": 144380 }, { "epoch": 1.56, "learning_rate": 6.585911655964195e-05, "loss": 0.0073, "step": 144390 }, { "epoch": 1.56, "learning_rate": 6.584290069403904e-05, "loss": 0.0088, "step": 144400 }, { "epoch": 1.56, "learning_rate": 6.582668482843614e-05, "loss": 0.0085, "step": 144410 }, { "epoch": 1.56, "learning_rate": 6.581046896283323e-05, "loss": 0.0104, "step": 144420 }, { "epoch": 1.56, "learning_rate": 6.579425309723032e-05, "loss": 0.007, "step": 144430 }, { "epoch": 1.56, "learning_rate": 6.577803723162741e-05, "loss": 0.007, "step": 144440 }, { "epoch": 1.56, "learning_rate": 6.576182136602452e-05, "loss": 0.0077, "step": 144450 }, { "epoch": 1.56, "learning_rate": 6.574560550042161e-05, "loss": 0.0111, "step": 144460 }, { "epoch": 1.56, "learning_rate": 6.57293896348187e-05, "loss": 0.0124, "step": 144470 }, { "epoch": 1.56, "learning_rate": 6.57131737692158e-05, "loss": 0.0085, "step": 144480 }, { "epoch": 1.56, "learning_rate": 6.569695790361289e-05, "loss": 0.0079, "step": 144490 }, { "epoch": 1.56, "learning_rate": 6.568074203800998e-05, "loss": 0.0058, "step": 144500 }, { "epoch": 1.56, "learning_rate": 6.566452617240708e-05, "loss": 0.0078, "step": 144510 }, { "epoch": 1.56, "learning_rate": 6.564831030680417e-05, "loss": 0.0066, "step": 144520 }, { "epoch": 1.56, "learning_rate": 6.563209444120126e-05, "loss": 0.0072, "step": 144530 }, { "epoch": 1.56, "learning_rate": 6.561587857559836e-05, "loss": 0.0083, "step": 144540 }, { "epoch": 1.56, "learning_rate": 6.559966270999545e-05, "loss": 0.006, "step": 144550 }, { "epoch": 1.56, "learning_rate": 6.558344684439255e-05, "loss": 0.0069, "step": 144560 }, { "epoch": 1.56, "learning_rate": 6.556723097878965e-05, "loss": 0.008, "step": 144570 }, { "epoch": 1.56, "learning_rate": 6.555101511318674e-05, "loss": 0.009, "step": 144580 }, { "epoch": 1.56, "learning_rate": 6.553479924758383e-05, "loss": 0.0069, "step": 144590 }, { "epoch": 1.56, "learning_rate": 6.551858338198093e-05, "loss": 0.0082, "step": 144600 }, { "epoch": 1.56, "learning_rate": 6.550236751637802e-05, "loss": 0.0065, "step": 144610 }, { "epoch": 1.56, "learning_rate": 6.548615165077511e-05, "loss": 0.0089, "step": 144620 }, { "epoch": 1.56, "learning_rate": 6.54699357851722e-05, "loss": 0.0049, "step": 144630 }, { "epoch": 1.56, "learning_rate": 6.54537199195693e-05, "loss": 0.0072, "step": 144640 }, { "epoch": 1.56, "learning_rate": 6.543750405396639e-05, "loss": 0.0062, "step": 144650 }, { "epoch": 1.56, "learning_rate": 6.542128818836348e-05, "loss": 0.0071, "step": 144660 }, { "epoch": 1.56, "learning_rate": 6.540507232276059e-05, "loss": 0.0079, "step": 144670 }, { "epoch": 1.56, "learning_rate": 6.538885645715768e-05, "loss": 0.0075, "step": 144680 }, { "epoch": 1.56, "learning_rate": 6.537264059155477e-05, "loss": 0.0092, "step": 144690 }, { "epoch": 1.56, "learning_rate": 6.535642472595187e-05, "loss": 0.0076, "step": 144700 }, { "epoch": 1.56, "learning_rate": 6.534020886034896e-05, "loss": 0.0084, "step": 144710 }, { "epoch": 1.56, "learning_rate": 6.532399299474605e-05, "loss": 0.0092, "step": 144720 }, { "epoch": 1.56, "learning_rate": 6.530777712914314e-05, "loss": 0.0069, "step": 144730 }, { "epoch": 1.56, "learning_rate": 6.529156126354024e-05, "loss": 0.0075, "step": 144740 }, { "epoch": 1.56, "learning_rate": 6.527534539793733e-05, "loss": 0.0072, "step": 144750 }, { "epoch": 1.56, "learning_rate": 6.525912953233442e-05, "loss": 0.0058, "step": 144760 }, { "epoch": 1.57, "learning_rate": 6.524291366673152e-05, "loss": 0.0109, "step": 144770 }, { "epoch": 1.57, "learning_rate": 6.522669780112862e-05, "loss": 0.0088, "step": 144780 }, { "epoch": 1.57, "learning_rate": 6.521048193552571e-05, "loss": 0.01, "step": 144790 }, { "epoch": 1.57, "learning_rate": 6.519426606992281e-05, "loss": 0.0068, "step": 144800 }, { "epoch": 1.57, "learning_rate": 6.51780502043199e-05, "loss": 0.0088, "step": 144810 }, { "epoch": 1.57, "learning_rate": 6.516183433871699e-05, "loss": 0.0083, "step": 144820 }, { "epoch": 1.57, "learning_rate": 6.514561847311409e-05, "loss": 0.007, "step": 144830 }, { "epoch": 1.57, "learning_rate": 6.512940260751118e-05, "loss": 0.0082, "step": 144840 }, { "epoch": 1.57, "learning_rate": 6.511318674190827e-05, "loss": 0.0076, "step": 144850 }, { "epoch": 1.57, "learning_rate": 6.509697087630536e-05, "loss": 0.0067, "step": 144860 }, { "epoch": 1.57, "learning_rate": 6.508075501070246e-05, "loss": 0.0101, "step": 144870 }, { "epoch": 1.57, "learning_rate": 6.506453914509955e-05, "loss": 0.0071, "step": 144880 }, { "epoch": 1.57, "learning_rate": 6.504832327949666e-05, "loss": 0.0071, "step": 144890 }, { "epoch": 1.57, "learning_rate": 6.503210741389375e-05, "loss": 0.0087, "step": 144900 }, { "epoch": 1.57, "learning_rate": 6.501589154829084e-05, "loss": 0.0073, "step": 144910 }, { "epoch": 1.57, "learning_rate": 6.499967568268793e-05, "loss": 0.0075, "step": 144920 }, { "epoch": 1.57, "learning_rate": 6.498345981708503e-05, "loss": 0.0085, "step": 144930 }, { "epoch": 1.57, "learning_rate": 6.496724395148213e-05, "loss": 0.0101, "step": 144940 }, { "epoch": 1.57, "learning_rate": 6.495102808587923e-05, "loss": 0.0091, "step": 144950 }, { "epoch": 1.57, "learning_rate": 6.493481222027632e-05, "loss": 0.0085, "step": 144960 }, { "epoch": 1.57, "learning_rate": 6.491859635467341e-05, "loss": 0.0086, "step": 144970 }, { "epoch": 1.57, "learning_rate": 6.49023804890705e-05, "loss": 0.0085, "step": 144980 }, { "epoch": 1.57, "learning_rate": 6.48861646234676e-05, "loss": 0.0101, "step": 144990 }, { "epoch": 1.57, "learning_rate": 6.486994875786469e-05, "loss": 0.0094, "step": 145000 }, { "epoch": 1.57, "eval_cer": 0.9215243287002052, "eval_loss": 0.006177145056426525, "eval_runtime": 121.3378, "eval_samples_per_second": 16.483, "eval_steps_per_second": 4.121, "step": 145000 }, { "epoch": 1.57, "learning_rate": 6.485373289226178e-05, "loss": 0.0086, "step": 145010 }, { "epoch": 1.57, "learning_rate": 6.483751702665887e-05, "loss": 0.0069, "step": 145020 }, { "epoch": 1.57, "learning_rate": 6.482130116105598e-05, "loss": 0.0105, "step": 145030 }, { "epoch": 1.57, "learning_rate": 6.480508529545307e-05, "loss": 0.0079, "step": 145040 }, { "epoch": 1.57, "learning_rate": 6.478886942985017e-05, "loss": 0.0086, "step": 145050 }, { "epoch": 1.57, "learning_rate": 6.477265356424726e-05, "loss": 0.0079, "step": 145060 }, { "epoch": 1.57, "learning_rate": 6.475643769864435e-05, "loss": 0.0074, "step": 145070 }, { "epoch": 1.57, "learning_rate": 6.474022183304144e-05, "loss": 0.0062, "step": 145080 }, { "epoch": 1.57, "learning_rate": 6.472400596743854e-05, "loss": 0.0071, "step": 145090 }, { "epoch": 1.57, "learning_rate": 6.470779010183563e-05, "loss": 0.0075, "step": 145100 }, { "epoch": 1.57, "learning_rate": 6.469157423623272e-05, "loss": 0.0079, "step": 145110 }, { "epoch": 1.57, "learning_rate": 6.467535837062982e-05, "loss": 0.0083, "step": 145120 }, { "epoch": 1.57, "learning_rate": 6.465914250502691e-05, "loss": 0.0068, "step": 145130 }, { "epoch": 1.57, "learning_rate": 6.464292663942402e-05, "loss": 0.008, "step": 145140 }, { "epoch": 1.57, "learning_rate": 6.462671077382111e-05, "loss": 0.0098, "step": 145150 }, { "epoch": 1.57, "learning_rate": 6.46104949082182e-05, "loss": 0.0088, "step": 145160 }, { "epoch": 1.57, "learning_rate": 6.45942790426153e-05, "loss": 0.0074, "step": 145170 }, { "epoch": 1.57, "learning_rate": 6.457806317701239e-05, "loss": 0.0084, "step": 145180 }, { "epoch": 1.57, "learning_rate": 6.456184731140948e-05, "loss": 0.0065, "step": 145190 }, { "epoch": 1.57, "learning_rate": 6.454563144580657e-05, "loss": 0.0077, "step": 145200 }, { "epoch": 1.57, "learning_rate": 6.452941558020366e-05, "loss": 0.0094, "step": 145210 }, { "epoch": 1.57, "learning_rate": 6.451319971460076e-05, "loss": 0.0084, "step": 145220 }, { "epoch": 1.57, "learning_rate": 6.449698384899785e-05, "loss": 0.0051, "step": 145230 }, { "epoch": 1.57, "learning_rate": 6.448076798339494e-05, "loss": 0.0077, "step": 145240 }, { "epoch": 1.57, "learning_rate": 6.446455211779205e-05, "loss": 0.0061, "step": 145250 }, { "epoch": 1.57, "learning_rate": 6.444833625218914e-05, "loss": 0.0085, "step": 145260 }, { "epoch": 1.57, "learning_rate": 6.443212038658623e-05, "loss": 0.0074, "step": 145270 }, { "epoch": 1.57, "learning_rate": 6.441590452098333e-05, "loss": 0.0072, "step": 145280 }, { "epoch": 1.57, "learning_rate": 6.439968865538042e-05, "loss": 0.0064, "step": 145290 }, { "epoch": 1.57, "learning_rate": 6.438347278977751e-05, "loss": 0.0085, "step": 145300 }, { "epoch": 1.57, "learning_rate": 6.43672569241746e-05, "loss": 0.0074, "step": 145310 }, { "epoch": 1.57, "learning_rate": 6.43510410585717e-05, "loss": 0.0098, "step": 145320 }, { "epoch": 1.57, "learning_rate": 6.433482519296879e-05, "loss": 0.0061, "step": 145330 }, { "epoch": 1.57, "learning_rate": 6.431860932736588e-05, "loss": 0.0077, "step": 145340 }, { "epoch": 1.57, "learning_rate": 6.430239346176298e-05, "loss": 0.0082, "step": 145350 }, { "epoch": 1.57, "learning_rate": 6.428617759616008e-05, "loss": 0.008, "step": 145360 }, { "epoch": 1.57, "learning_rate": 6.426996173055718e-05, "loss": 0.0083, "step": 145370 }, { "epoch": 1.57, "learning_rate": 6.425374586495427e-05, "loss": 0.0102, "step": 145380 }, { "epoch": 1.57, "learning_rate": 6.423752999935136e-05, "loss": 0.0088, "step": 145390 }, { "epoch": 1.57, "learning_rate": 6.422131413374845e-05, "loss": 0.0059, "step": 145400 }, { "epoch": 1.57, "learning_rate": 6.420509826814555e-05, "loss": 0.0076, "step": 145410 }, { "epoch": 1.57, "learning_rate": 6.418888240254264e-05, "loss": 0.009, "step": 145420 }, { "epoch": 1.57, "learning_rate": 6.417266653693973e-05, "loss": 0.0057, "step": 145430 }, { "epoch": 1.57, "learning_rate": 6.415645067133682e-05, "loss": 0.0057, "step": 145440 }, { "epoch": 1.57, "learning_rate": 6.414023480573392e-05, "loss": 0.0081, "step": 145450 }, { "epoch": 1.57, "learning_rate": 6.412401894013102e-05, "loss": 0.0075, "step": 145460 }, { "epoch": 1.57, "learning_rate": 6.410780307452812e-05, "loss": 0.0082, "step": 145470 }, { "epoch": 1.57, "learning_rate": 6.409158720892521e-05, "loss": 0.0088, "step": 145480 }, { "epoch": 1.57, "learning_rate": 6.40753713433223e-05, "loss": 0.0078, "step": 145490 }, { "epoch": 1.57, "learning_rate": 6.40591554777194e-05, "loss": 0.0081, "step": 145500 }, { "epoch": 1.57, "learning_rate": 6.404293961211649e-05, "loss": 0.0062, "step": 145510 }, { "epoch": 1.57, "learning_rate": 6.402672374651358e-05, "loss": 0.0076, "step": 145520 }, { "epoch": 1.57, "learning_rate": 6.401050788091067e-05, "loss": 0.0074, "step": 145530 }, { "epoch": 1.57, "learning_rate": 6.399429201530777e-05, "loss": 0.0079, "step": 145540 }, { "epoch": 1.57, "learning_rate": 6.397807614970486e-05, "loss": 0.0143, "step": 145550 }, { "epoch": 1.57, "learning_rate": 6.396186028410195e-05, "loss": 0.0075, "step": 145560 }, { "epoch": 1.57, "learning_rate": 6.394564441849906e-05, "loss": 0.007, "step": 145570 }, { "epoch": 1.57, "learning_rate": 6.392942855289615e-05, "loss": 0.0066, "step": 145580 }, { "epoch": 1.57, "learning_rate": 6.391321268729324e-05, "loss": 0.0089, "step": 145590 }, { "epoch": 1.57, "learning_rate": 6.389699682169034e-05, "loss": 0.0076, "step": 145600 }, { "epoch": 1.57, "learning_rate": 6.388078095608743e-05, "loss": 0.0065, "step": 145610 }, { "epoch": 1.57, "learning_rate": 6.386456509048452e-05, "loss": 0.0066, "step": 145620 }, { "epoch": 1.57, "learning_rate": 6.384834922488161e-05, "loss": 0.0099, "step": 145630 }, { "epoch": 1.57, "learning_rate": 6.38321333592787e-05, "loss": 0.0063, "step": 145640 }, { "epoch": 1.57, "learning_rate": 6.38159174936758e-05, "loss": 0.0059, "step": 145650 }, { "epoch": 1.57, "learning_rate": 6.37997016280729e-05, "loss": 0.008, "step": 145660 }, { "epoch": 1.57, "learning_rate": 6.378348576247e-05, "loss": 0.0095, "step": 145670 }, { "epoch": 1.57, "learning_rate": 6.376726989686709e-05, "loss": 0.009, "step": 145680 }, { "epoch": 1.57, "learning_rate": 6.375105403126418e-05, "loss": 0.0069, "step": 145690 }, { "epoch": 1.58, "learning_rate": 6.373483816566128e-05, "loss": 0.0076, "step": 145700 }, { "epoch": 1.58, "learning_rate": 6.371862230005837e-05, "loss": 0.0075, "step": 145710 }, { "epoch": 1.58, "learning_rate": 6.370240643445548e-05, "loss": 0.0085, "step": 145720 }, { "epoch": 1.58, "learning_rate": 6.368619056885257e-05, "loss": 0.0087, "step": 145730 }, { "epoch": 1.58, "learning_rate": 6.366997470324966e-05, "loss": 0.0079, "step": 145740 }, { "epoch": 1.58, "learning_rate": 6.365375883764675e-05, "loss": 0.0082, "step": 145750 }, { "epoch": 1.58, "learning_rate": 6.363754297204385e-05, "loss": 0.0079, "step": 145760 }, { "epoch": 1.58, "learning_rate": 6.362132710644094e-05, "loss": 0.0073, "step": 145770 }, { "epoch": 1.58, "learning_rate": 6.360511124083803e-05, "loss": 0.0111, "step": 145780 }, { "epoch": 1.58, "learning_rate": 6.358889537523512e-05, "loss": 0.0088, "step": 145790 }, { "epoch": 1.58, "learning_rate": 6.357267950963222e-05, "loss": 0.0098, "step": 145800 }, { "epoch": 1.58, "learning_rate": 6.355646364402931e-05, "loss": 0.0068, "step": 145810 }, { "epoch": 1.58, "learning_rate": 6.35402477784264e-05, "loss": 0.0096, "step": 145820 }, { "epoch": 1.58, "learning_rate": 6.352403191282351e-05, "loss": 0.0079, "step": 145830 }, { "epoch": 1.58, "learning_rate": 6.35078160472206e-05, "loss": 0.0079, "step": 145840 }, { "epoch": 1.58, "learning_rate": 6.34916001816177e-05, "loss": 0.0076, "step": 145850 }, { "epoch": 1.58, "learning_rate": 6.347538431601479e-05, "loss": 0.0087, "step": 145860 }, { "epoch": 1.58, "learning_rate": 6.345916845041188e-05, "loss": 0.007, "step": 145870 }, { "epoch": 1.58, "learning_rate": 6.344295258480897e-05, "loss": 0.0087, "step": 145880 }, { "epoch": 1.58, "learning_rate": 6.342673671920607e-05, "loss": 0.0082, "step": 145890 }, { "epoch": 1.58, "learning_rate": 6.341052085360316e-05, "loss": 0.0075, "step": 145900 }, { "epoch": 1.58, "learning_rate": 6.339430498800025e-05, "loss": 0.0087, "step": 145910 }, { "epoch": 1.58, "learning_rate": 6.337808912239734e-05, "loss": 0.0085, "step": 145920 }, { "epoch": 1.58, "learning_rate": 6.336187325679444e-05, "loss": 0.0078, "step": 145930 }, { "epoch": 1.58, "learning_rate": 6.334565739119154e-05, "loss": 0.006, "step": 145940 }, { "epoch": 1.58, "learning_rate": 6.332944152558864e-05, "loss": 0.0067, "step": 145950 }, { "epoch": 1.58, "learning_rate": 6.331322565998573e-05, "loss": 0.0107, "step": 145960 }, { "epoch": 1.58, "learning_rate": 6.329700979438282e-05, "loss": 0.0057, "step": 145970 }, { "epoch": 1.58, "learning_rate": 6.328079392877991e-05, "loss": 0.0076, "step": 145980 }, { "epoch": 1.58, "learning_rate": 6.3264578063177e-05, "loss": 0.0088, "step": 145990 }, { "epoch": 1.58, "learning_rate": 6.32483621975741e-05, "loss": 0.0085, "step": 146000 }, { "epoch": 1.58, "eval_cer": 0.921514774067685, "eval_loss": 0.006277143489569426, "eval_runtime": 121.0938, "eval_samples_per_second": 16.516, "eval_steps_per_second": 4.129, "step": 146000 }, { "epoch": 1.58, "learning_rate": 6.323214633197119e-05, "loss": 0.0072, "step": 146010 }, { "epoch": 1.58, "learning_rate": 6.321593046636828e-05, "loss": 0.0079, "step": 146020 }, { "epoch": 1.58, "learning_rate": 6.319971460076538e-05, "loss": 0.0069, "step": 146030 }, { "epoch": 1.58, "learning_rate": 6.318349873516248e-05, "loss": 0.0089, "step": 146040 }, { "epoch": 1.58, "learning_rate": 6.316728286955958e-05, "loss": 0.0076, "step": 146050 }, { "epoch": 1.58, "learning_rate": 6.315106700395667e-05, "loss": 0.0082, "step": 146060 }, { "epoch": 1.58, "learning_rate": 6.313485113835376e-05, "loss": 0.0071, "step": 146070 }, { "epoch": 1.58, "learning_rate": 6.311863527275085e-05, "loss": 0.0104, "step": 146080 }, { "epoch": 1.58, "learning_rate": 6.310241940714795e-05, "loss": 0.0073, "step": 146090 }, { "epoch": 1.58, "learning_rate": 6.308620354154504e-05, "loss": 0.0079, "step": 146100 }, { "epoch": 1.58, "learning_rate": 6.306998767594213e-05, "loss": 0.0109, "step": 146110 }, { "epoch": 1.58, "learning_rate": 6.305377181033923e-05, "loss": 0.0056, "step": 146120 }, { "epoch": 1.58, "learning_rate": 6.303755594473632e-05, "loss": 0.0067, "step": 146130 }, { "epoch": 1.58, "learning_rate": 6.302134007913341e-05, "loss": 0.007, "step": 146140 }, { "epoch": 1.58, "learning_rate": 6.300512421353052e-05, "loss": 0.0078, "step": 146150 }, { "epoch": 1.58, "learning_rate": 6.298890834792761e-05, "loss": 0.0088, "step": 146160 }, { "epoch": 1.58, "learning_rate": 6.29726924823247e-05, "loss": 0.01, "step": 146170 }, { "epoch": 1.58, "learning_rate": 6.29564766167218e-05, "loss": 0.0083, "step": 146180 }, { "epoch": 1.58, "learning_rate": 6.294026075111889e-05, "loss": 0.0069, "step": 146190 }, { "epoch": 1.58, "learning_rate": 6.292404488551598e-05, "loss": 0.0082, "step": 146200 }, { "epoch": 1.58, "learning_rate": 6.290782901991307e-05, "loss": 0.011, "step": 146210 }, { "epoch": 1.58, "learning_rate": 6.289161315431017e-05, "loss": 0.0074, "step": 146220 }, { "epoch": 1.58, "learning_rate": 6.287539728870726e-05, "loss": 0.0105, "step": 146230 }, { "epoch": 1.58, "learning_rate": 6.285918142310435e-05, "loss": 0.0093, "step": 146240 }, { "epoch": 1.58, "learning_rate": 6.284296555750145e-05, "loss": 0.0087, "step": 146250 }, { "epoch": 1.58, "learning_rate": 6.282674969189855e-05, "loss": 0.0083, "step": 146260 }, { "epoch": 1.58, "learning_rate": 6.281053382629564e-05, "loss": 0.0073, "step": 146270 }, { "epoch": 1.58, "learning_rate": 6.279431796069274e-05, "loss": 0.0101, "step": 146280 }, { "epoch": 1.58, "learning_rate": 6.277810209508983e-05, "loss": 0.0086, "step": 146290 }, { "epoch": 1.58, "learning_rate": 6.276188622948692e-05, "loss": 0.0095, "step": 146300 }, { "epoch": 1.58, "learning_rate": 6.274567036388402e-05, "loss": 0.0088, "step": 146310 }, { "epoch": 1.58, "learning_rate": 6.272945449828111e-05, "loss": 0.0073, "step": 146320 }, { "epoch": 1.58, "learning_rate": 6.27132386326782e-05, "loss": 0.0086, "step": 146330 }, { "epoch": 1.58, "learning_rate": 6.26970227670753e-05, "loss": 0.0078, "step": 146340 }, { "epoch": 1.58, "learning_rate": 6.268080690147239e-05, "loss": 0.0071, "step": 146350 }, { "epoch": 1.58, "learning_rate": 6.266459103586948e-05, "loss": 0.008, "step": 146360 }, { "epoch": 1.58, "learning_rate": 6.264837517026659e-05, "loss": 0.0068, "step": 146370 }, { "epoch": 1.58, "learning_rate": 6.263215930466368e-05, "loss": 0.0088, "step": 146380 }, { "epoch": 1.58, "learning_rate": 6.261594343906077e-05, "loss": 0.007, "step": 146390 }, { "epoch": 1.58, "learning_rate": 6.259972757345786e-05, "loss": 0.0075, "step": 146400 }, { "epoch": 1.58, "learning_rate": 6.258351170785497e-05, "loss": 0.0106, "step": 146410 }, { "epoch": 1.58, "learning_rate": 6.256729584225206e-05, "loss": 0.0073, "step": 146420 }, { "epoch": 1.58, "learning_rate": 6.255107997664916e-05, "loss": 0.009, "step": 146430 }, { "epoch": 1.58, "learning_rate": 6.253486411104625e-05, "loss": 0.0081, "step": 146440 }, { "epoch": 1.58, "learning_rate": 6.251864824544334e-05, "loss": 0.0082, "step": 146450 }, { "epoch": 1.58, "learning_rate": 6.250243237984043e-05, "loss": 0.0079, "step": 146460 }, { "epoch": 1.58, "learning_rate": 6.248621651423753e-05, "loss": 0.012, "step": 146470 }, { "epoch": 1.58, "learning_rate": 6.247000064863462e-05, "loss": 0.0069, "step": 146480 }, { "epoch": 1.58, "learning_rate": 6.245378478303171e-05, "loss": 0.0074, "step": 146490 }, { "epoch": 1.58, "learning_rate": 6.24375689174288e-05, "loss": 0.0095, "step": 146500 }, { "epoch": 1.58, "learning_rate": 6.24213530518259e-05, "loss": 0.0061, "step": 146510 }, { "epoch": 1.58, "learning_rate": 6.2405137186223e-05, "loss": 0.0085, "step": 146520 }, { "epoch": 1.58, "learning_rate": 6.23889213206201e-05, "loss": 0.011, "step": 146530 }, { "epoch": 1.58, "learning_rate": 6.237270545501719e-05, "loss": 0.0115, "step": 146540 }, { "epoch": 1.58, "learning_rate": 6.235648958941428e-05, "loss": 0.011, "step": 146550 }, { "epoch": 1.58, "learning_rate": 6.234027372381137e-05, "loss": 0.0076, "step": 146560 }, { "epoch": 1.58, "learning_rate": 6.232405785820847e-05, "loss": 0.0068, "step": 146570 }, { "epoch": 1.58, "learning_rate": 6.230784199260556e-05, "loss": 0.0075, "step": 146580 }, { "epoch": 1.58, "learning_rate": 6.229162612700265e-05, "loss": 0.0063, "step": 146590 }, { "epoch": 1.58, "learning_rate": 6.227541026139975e-05, "loss": 0.0078, "step": 146600 }, { "epoch": 1.58, "learning_rate": 6.225919439579684e-05, "loss": 0.0071, "step": 146610 }, { "epoch": 1.59, "learning_rate": 6.224297853019394e-05, "loss": 0.0087, "step": 146620 }, { "epoch": 1.59, "learning_rate": 6.222676266459104e-05, "loss": 0.0074, "step": 146630 }, { "epoch": 1.59, "learning_rate": 6.221054679898813e-05, "loss": 0.0067, "step": 146640 }, { "epoch": 1.59, "learning_rate": 6.219433093338522e-05, "loss": 0.0064, "step": 146650 }, { "epoch": 1.59, "learning_rate": 6.217811506778232e-05, "loss": 0.0063, "step": 146660 }, { "epoch": 1.59, "learning_rate": 6.216189920217941e-05, "loss": 0.0068, "step": 146670 }, { "epoch": 1.59, "learning_rate": 6.21456833365765e-05, "loss": 0.0061, "step": 146680 }, { "epoch": 1.59, "learning_rate": 6.21294674709736e-05, "loss": 0.0079, "step": 146690 }, { "epoch": 1.59, "learning_rate": 6.211325160537069e-05, "loss": 0.0085, "step": 146700 }, { "epoch": 1.59, "learning_rate": 6.209703573976778e-05, "loss": 0.0085, "step": 146710 }, { "epoch": 1.59, "learning_rate": 6.208081987416487e-05, "loss": 0.0083, "step": 146720 }, { "epoch": 1.59, "learning_rate": 6.206460400856198e-05, "loss": 0.0062, "step": 146730 }, { "epoch": 1.59, "learning_rate": 6.204838814295907e-05, "loss": 0.0085, "step": 146740 }, { "epoch": 1.59, "learning_rate": 6.203217227735616e-05, "loss": 0.0079, "step": 146750 }, { "epoch": 1.59, "learning_rate": 6.201595641175326e-05, "loss": 0.0083, "step": 146760 }, { "epoch": 1.59, "learning_rate": 6.199974054615035e-05, "loss": 0.0077, "step": 146770 }, { "epoch": 1.59, "learning_rate": 6.198352468054744e-05, "loss": 0.0071, "step": 146780 }, { "epoch": 1.59, "learning_rate": 6.196730881494453e-05, "loss": 0.0063, "step": 146790 }, { "epoch": 1.59, "learning_rate": 6.195109294934163e-05, "loss": 0.0085, "step": 146800 }, { "epoch": 1.59, "learning_rate": 6.193487708373872e-05, "loss": 0.0086, "step": 146810 }, { "epoch": 1.59, "learning_rate": 6.191866121813581e-05, "loss": 0.008, "step": 146820 }, { "epoch": 1.59, "learning_rate": 6.19024453525329e-05, "loss": 0.007, "step": 146830 }, { "epoch": 1.59, "learning_rate": 6.188622948693001e-05, "loss": 0.0087, "step": 146840 }, { "epoch": 1.59, "learning_rate": 6.18700136213271e-05, "loss": 0.0078, "step": 146850 }, { "epoch": 1.59, "learning_rate": 6.18537977557242e-05, "loss": 0.0124, "step": 146860 }, { "epoch": 1.59, "learning_rate": 6.183758189012129e-05, "loss": 0.0067, "step": 146870 }, { "epoch": 1.59, "learning_rate": 6.182136602451838e-05, "loss": 0.01, "step": 146880 }, { "epoch": 1.59, "learning_rate": 6.180515015891548e-05, "loss": 0.0067, "step": 146890 }, { "epoch": 1.59, "learning_rate": 6.178893429331257e-05, "loss": 0.008, "step": 146900 }, { "epoch": 1.59, "learning_rate": 6.177271842770966e-05, "loss": 0.0082, "step": 146910 }, { "epoch": 1.59, "learning_rate": 6.175650256210675e-05, "loss": 0.006, "step": 146920 }, { "epoch": 1.59, "learning_rate": 6.174028669650385e-05, "loss": 0.0062, "step": 146930 }, { "epoch": 1.59, "learning_rate": 6.172407083090094e-05, "loss": 0.0076, "step": 146940 }, { "epoch": 1.59, "learning_rate": 6.170785496529805e-05, "loss": 0.0065, "step": 146950 }, { "epoch": 1.59, "learning_rate": 6.169163909969514e-05, "loss": 0.008, "step": 146960 }, { "epoch": 1.59, "learning_rate": 6.167542323409223e-05, "loss": 0.0074, "step": 146970 }, { "epoch": 1.59, "learning_rate": 6.165920736848932e-05, "loss": 0.0064, "step": 146980 }, { "epoch": 1.59, "learning_rate": 6.164299150288642e-05, "loss": 0.0063, "step": 146990 }, { "epoch": 1.59, "learning_rate": 6.162677563728351e-05, "loss": 0.0091, "step": 147000 }, { "epoch": 1.59, "eval_cer": 0.9215234600972488, "eval_loss": 0.006228927057236433, "eval_runtime": 121.1059, "eval_samples_per_second": 16.514, "eval_steps_per_second": 4.129, "step": 147000 }, { "epoch": 1.59, "learning_rate": 6.16105597716806e-05, "loss": 0.0088, "step": 147010 }, { "epoch": 1.59, "learning_rate": 6.15943439060777e-05, "loss": 0.0072, "step": 147020 }, { "epoch": 1.59, "learning_rate": 6.157812804047479e-05, "loss": 0.0072, "step": 147030 }, { "epoch": 1.59, "learning_rate": 6.156191217487188e-05, "loss": 0.0063, "step": 147040 }, { "epoch": 1.59, "learning_rate": 6.154569630926899e-05, "loss": 0.0083, "step": 147050 }, { "epoch": 1.59, "learning_rate": 6.152948044366608e-05, "loss": 0.0062, "step": 147060 }, { "epoch": 1.59, "learning_rate": 6.151326457806317e-05, "loss": 0.0068, "step": 147070 }, { "epoch": 1.59, "learning_rate": 6.149704871246026e-05, "loss": 0.0093, "step": 147080 }, { "epoch": 1.59, "learning_rate": 6.148083284685736e-05, "loss": 0.0057, "step": 147090 }, { "epoch": 1.59, "learning_rate": 6.146461698125446e-05, "loss": 0.005, "step": 147100 }, { "epoch": 1.59, "learning_rate": 6.144840111565156e-05, "loss": 0.0077, "step": 147110 }, { "epoch": 1.59, "learning_rate": 6.143218525004865e-05, "loss": 0.0068, "step": 147120 }, { "epoch": 1.59, "learning_rate": 6.141596938444574e-05, "loss": 0.0068, "step": 147130 }, { "epoch": 1.59, "learning_rate": 6.139975351884283e-05, "loss": 0.0072, "step": 147140 }, { "epoch": 1.59, "learning_rate": 6.138353765323993e-05, "loss": 0.0065, "step": 147150 }, { "epoch": 1.59, "learning_rate": 6.136732178763702e-05, "loss": 0.0069, "step": 147160 }, { "epoch": 1.59, "learning_rate": 6.135110592203411e-05, "loss": 0.0055, "step": 147170 }, { "epoch": 1.59, "learning_rate": 6.13348900564312e-05, "loss": 0.0083, "step": 147180 }, { "epoch": 1.59, "learning_rate": 6.13186741908283e-05, "loss": 0.0106, "step": 147190 }, { "epoch": 1.59, "learning_rate": 6.13024583252254e-05, "loss": 0.0089, "step": 147200 }, { "epoch": 1.59, "learning_rate": 6.12862424596225e-05, "loss": 0.0082, "step": 147210 }, { "epoch": 1.59, "learning_rate": 6.127002659401959e-05, "loss": 0.0097, "step": 147220 }, { "epoch": 1.59, "learning_rate": 6.125381072841668e-05, "loss": 0.0082, "step": 147230 }, { "epoch": 1.59, "learning_rate": 6.123759486281378e-05, "loss": 0.0057, "step": 147240 }, { "epoch": 1.59, "learning_rate": 6.122137899721087e-05, "loss": 0.0073, "step": 147250 }, { "epoch": 1.59, "learning_rate": 6.120516313160796e-05, "loss": 0.007, "step": 147260 }, { "epoch": 1.59, "learning_rate": 6.118894726600505e-05, "loss": 0.0076, "step": 147270 }, { "epoch": 1.59, "learning_rate": 6.117273140040215e-05, "loss": 0.0059, "step": 147280 }, { "epoch": 1.59, "learning_rate": 6.115651553479924e-05, "loss": 0.0065, "step": 147290 }, { "epoch": 1.59, "learning_rate": 6.114029966919633e-05, "loss": 0.0074, "step": 147300 }, { "epoch": 1.59, "learning_rate": 6.112408380359344e-05, "loss": 0.0063, "step": 147310 }, { "epoch": 1.59, "learning_rate": 6.110786793799053e-05, "loss": 0.0083, "step": 147320 }, { "epoch": 1.59, "learning_rate": 6.109165207238762e-05, "loss": 0.0085, "step": 147330 }, { "epoch": 1.59, "learning_rate": 6.107543620678472e-05, "loss": 0.0088, "step": 147340 }, { "epoch": 1.59, "learning_rate": 6.105922034118181e-05, "loss": 0.0066, "step": 147350 }, { "epoch": 1.59, "learning_rate": 6.10430044755789e-05, "loss": 0.0099, "step": 147360 }, { "epoch": 1.59, "learning_rate": 6.1026788609975995e-05, "loss": 0.007, "step": 147370 }, { "epoch": 1.59, "learning_rate": 6.101057274437309e-05, "loss": 0.0078, "step": 147380 }, { "epoch": 1.59, "learning_rate": 6.099435687877019e-05, "loss": 0.009, "step": 147390 }, { "epoch": 1.59, "learning_rate": 6.097814101316728e-05, "loss": 0.0073, "step": 147400 }, { "epoch": 1.59, "learning_rate": 6.096192514756437e-05, "loss": 0.0073, "step": 147410 }, { "epoch": 1.59, "learning_rate": 6.0945709281961465e-05, "loss": 0.0079, "step": 147420 }, { "epoch": 1.59, "learning_rate": 6.092949341635856e-05, "loss": 0.0086, "step": 147430 }, { "epoch": 1.59, "learning_rate": 6.091327755075565e-05, "loss": 0.0076, "step": 147440 }, { "epoch": 1.59, "learning_rate": 6.089706168515275e-05, "loss": 0.009, "step": 147450 }, { "epoch": 1.59, "learning_rate": 6.088084581954984e-05, "loss": 0.0072, "step": 147460 }, { "epoch": 1.59, "learning_rate": 6.0864629953946936e-05, "loss": 0.007, "step": 147470 }, { "epoch": 1.59, "learning_rate": 6.084841408834403e-05, "loss": 0.007, "step": 147480 }, { "epoch": 1.59, "learning_rate": 6.083219822274112e-05, "loss": 0.0073, "step": 147490 }, { "epoch": 1.59, "learning_rate": 6.081598235713822e-05, "loss": 0.0067, "step": 147500 }, { "epoch": 1.59, "learning_rate": 6.0799766491535314e-05, "loss": 0.007, "step": 147510 }, { "epoch": 1.59, "learning_rate": 6.0783550625932406e-05, "loss": 0.0082, "step": 147520 }, { "epoch": 1.59, "learning_rate": 6.07673347603295e-05, "loss": 0.0067, "step": 147530 }, { "epoch": 1.59, "learning_rate": 6.075111889472659e-05, "loss": 0.0072, "step": 147540 }, { "epoch": 1.6, "learning_rate": 6.073490302912369e-05, "loss": 0.009, "step": 147550 }, { "epoch": 1.6, "learning_rate": 6.0718687163520784e-05, "loss": 0.008, "step": 147560 }, { "epoch": 1.6, "learning_rate": 6.070247129791788e-05, "loss": 0.0052, "step": 147570 }, { "epoch": 1.6, "learning_rate": 6.068625543231497e-05, "loss": 0.0063, "step": 147580 }, { "epoch": 1.6, "learning_rate": 6.067003956671206e-05, "loss": 0.0095, "step": 147590 }, { "epoch": 1.6, "learning_rate": 6.0653823701109155e-05, "loss": 0.0064, "step": 147600 }, { "epoch": 1.6, "learning_rate": 6.0637607835506255e-05, "loss": 0.0082, "step": 147610 }, { "epoch": 1.6, "learning_rate": 6.062139196990335e-05, "loss": 0.0061, "step": 147620 }, { "epoch": 1.6, "learning_rate": 6.060517610430044e-05, "loss": 0.007, "step": 147630 }, { "epoch": 1.6, "learning_rate": 6.058896023869753e-05, "loss": 0.0052, "step": 147640 }, { "epoch": 1.6, "learning_rate": 6.0572744373094626e-05, "loss": 0.0089, "step": 147650 }, { "epoch": 1.6, "learning_rate": 6.0556528507491725e-05, "loss": 0.0076, "step": 147660 }, { "epoch": 1.6, "learning_rate": 6.054031264188882e-05, "loss": 0.0058, "step": 147670 }, { "epoch": 1.6, "learning_rate": 6.052409677628591e-05, "loss": 0.0092, "step": 147680 }, { "epoch": 1.6, "learning_rate": 6.0507880910683003e-05, "loss": 0.0074, "step": 147690 }, { "epoch": 1.6, "learning_rate": 6.0491665045080096e-05, "loss": 0.0071, "step": 147700 }, { "epoch": 1.6, "learning_rate": 6.047544917947719e-05, "loss": 0.0067, "step": 147710 }, { "epoch": 1.6, "learning_rate": 6.045923331387429e-05, "loss": 0.0064, "step": 147720 }, { "epoch": 1.6, "learning_rate": 6.044301744827138e-05, "loss": 0.0078, "step": 147730 }, { "epoch": 1.6, "learning_rate": 6.0426801582668474e-05, "loss": 0.0079, "step": 147740 }, { "epoch": 1.6, "learning_rate": 6.041058571706557e-05, "loss": 0.0065, "step": 147750 }, { "epoch": 1.6, "learning_rate": 6.039436985146266e-05, "loss": 0.0061, "step": 147760 }, { "epoch": 1.6, "learning_rate": 6.037815398585976e-05, "loss": 0.0078, "step": 147770 }, { "epoch": 1.6, "learning_rate": 6.036193812025685e-05, "loss": 0.0088, "step": 147780 }, { "epoch": 1.6, "learning_rate": 6.0345722254653944e-05, "loss": 0.0078, "step": 147790 }, { "epoch": 1.6, "learning_rate": 6.032950638905104e-05, "loss": 0.0082, "step": 147800 }, { "epoch": 1.6, "learning_rate": 6.031329052344813e-05, "loss": 0.0108, "step": 147810 }, { "epoch": 1.6, "learning_rate": 6.0297074657845236e-05, "loss": 0.0069, "step": 147820 }, { "epoch": 1.6, "learning_rate": 6.028085879224233e-05, "loss": 0.0063, "step": 147830 }, { "epoch": 1.6, "learning_rate": 6.026464292663942e-05, "loss": 0.0058, "step": 147840 }, { "epoch": 1.6, "learning_rate": 6.0248427061036514e-05, "loss": 0.0079, "step": 147850 }, { "epoch": 1.6, "learning_rate": 6.0232211195433614e-05, "loss": 0.0074, "step": 147860 }, { "epoch": 1.6, "learning_rate": 6.021599532983071e-05, "loss": 0.0083, "step": 147870 }, { "epoch": 1.6, "learning_rate": 6.01997794642278e-05, "loss": 0.0077, "step": 147880 }, { "epoch": 1.6, "learning_rate": 6.018356359862489e-05, "loss": 0.0078, "step": 147890 }, { "epoch": 1.6, "learning_rate": 6.0167347733021985e-05, "loss": 0.0063, "step": 147900 }, { "epoch": 1.6, "learning_rate": 6.015113186741908e-05, "loss": 0.0092, "step": 147910 }, { "epoch": 1.6, "learning_rate": 6.013491600181618e-05, "loss": 0.0079, "step": 147920 }, { "epoch": 1.6, "learning_rate": 6.011870013621327e-05, "loss": 0.0092, "step": 147930 }, { "epoch": 1.6, "learning_rate": 6.010248427061036e-05, "loss": 0.0081, "step": 147940 }, { "epoch": 1.6, "learning_rate": 6.0086268405007455e-05, "loss": 0.0089, "step": 147950 }, { "epoch": 1.6, "learning_rate": 6.007005253940455e-05, "loss": 0.0061, "step": 147960 }, { "epoch": 1.6, "learning_rate": 6.005383667380165e-05, "loss": 0.0086, "step": 147970 }, { "epoch": 1.6, "learning_rate": 6.003762080819874e-05, "loss": 0.0072, "step": 147980 }, { "epoch": 1.6, "learning_rate": 6.002140494259583e-05, "loss": 0.0075, "step": 147990 }, { "epoch": 1.6, "learning_rate": 6.0005189076992926e-05, "loss": 0.0087, "step": 148000 }, { "epoch": 1.6, "eval_cer": 0.9215364891415945, "eval_loss": 0.006136965937912464, "eval_runtime": 121.1416, "eval_samples_per_second": 16.51, "eval_steps_per_second": 4.127, "step": 148000 }, { "epoch": 1.6, "learning_rate": 5.998897321139002e-05, "loss": 0.0078, "step": 148010 }, { "epoch": 1.6, "learning_rate": 5.997275734578711e-05, "loss": 0.0073, "step": 148020 }, { "epoch": 1.6, "learning_rate": 5.995654148018421e-05, "loss": 0.0072, "step": 148030 }, { "epoch": 1.6, "learning_rate": 5.9940325614581304e-05, "loss": 0.0059, "step": 148040 }, { "epoch": 1.6, "learning_rate": 5.9924109748978396e-05, "loss": 0.0071, "step": 148050 }, { "epoch": 1.6, "learning_rate": 5.990789388337549e-05, "loss": 0.0071, "step": 148060 }, { "epoch": 1.6, "learning_rate": 5.989167801777258e-05, "loss": 0.0102, "step": 148070 }, { "epoch": 1.6, "learning_rate": 5.987546215216968e-05, "loss": 0.0062, "step": 148080 }, { "epoch": 1.6, "learning_rate": 5.9859246286566774e-05, "loss": 0.007, "step": 148090 }, { "epoch": 1.6, "learning_rate": 5.984303042096387e-05, "loss": 0.0055, "step": 148100 }, { "epoch": 1.6, "learning_rate": 5.982681455536096e-05, "loss": 0.0087, "step": 148110 }, { "epoch": 1.6, "learning_rate": 5.981059868975805e-05, "loss": 0.0077, "step": 148120 }, { "epoch": 1.6, "learning_rate": 5.979438282415515e-05, "loss": 0.0073, "step": 148130 }, { "epoch": 1.6, "learning_rate": 5.9778166958552245e-05, "loss": 0.0202, "step": 148140 }, { "epoch": 1.6, "learning_rate": 5.976195109294934e-05, "loss": 0.01, "step": 148150 }, { "epoch": 1.6, "learning_rate": 5.974573522734643e-05, "loss": 0.0071, "step": 148160 }, { "epoch": 1.6, "learning_rate": 5.972951936174352e-05, "loss": 0.0072, "step": 148170 }, { "epoch": 1.6, "learning_rate": 5.9713303496140616e-05, "loss": 0.0072, "step": 148180 }, { "epoch": 1.6, "learning_rate": 5.9697087630537715e-05, "loss": 0.0095, "step": 148190 }, { "epoch": 1.6, "learning_rate": 5.968087176493481e-05, "loss": 0.0063, "step": 148200 }, { "epoch": 1.6, "learning_rate": 5.96646558993319e-05, "loss": 0.0066, "step": 148210 }, { "epoch": 1.6, "learning_rate": 5.964844003372899e-05, "loss": 0.0064, "step": 148220 }, { "epoch": 1.6, "learning_rate": 5.9632224168126086e-05, "loss": 0.0086, "step": 148230 }, { "epoch": 1.6, "learning_rate": 5.9616008302523186e-05, "loss": 0.0066, "step": 148240 }, { "epoch": 1.6, "learning_rate": 5.959979243692028e-05, "loss": 0.0077, "step": 148250 }, { "epoch": 1.6, "learning_rate": 5.958357657131737e-05, "loss": 0.0105, "step": 148260 }, { "epoch": 1.6, "learning_rate": 5.9567360705714464e-05, "loss": 0.0068, "step": 148270 }, { "epoch": 1.6, "learning_rate": 5.9551144840111557e-05, "loss": 0.0085, "step": 148280 }, { "epoch": 1.6, "learning_rate": 5.9534928974508656e-05, "loss": 0.0092, "step": 148290 }, { "epoch": 1.6, "learning_rate": 5.951871310890575e-05, "loss": 0.0077, "step": 148300 }, { "epoch": 1.6, "learning_rate": 5.950249724330284e-05, "loss": 0.0069, "step": 148310 }, { "epoch": 1.6, "learning_rate": 5.9486281377699934e-05, "loss": 0.0067, "step": 148320 }, { "epoch": 1.6, "learning_rate": 5.947006551209703e-05, "loss": 0.0073, "step": 148330 }, { "epoch": 1.6, "learning_rate": 5.945384964649412e-05, "loss": 0.0059, "step": 148340 }, { "epoch": 1.6, "learning_rate": 5.943763378089122e-05, "loss": 0.0075, "step": 148350 }, { "epoch": 1.6, "learning_rate": 5.942141791528831e-05, "loss": 0.0105, "step": 148360 }, { "epoch": 1.6, "learning_rate": 5.9405202049685405e-05, "loss": 0.0059, "step": 148370 }, { "epoch": 1.6, "learning_rate": 5.93889861840825e-05, "loss": 0.0083, "step": 148380 }, { "epoch": 1.6, "learning_rate": 5.937277031847959e-05, "loss": 0.0073, "step": 148390 }, { "epoch": 1.6, "learning_rate": 5.935655445287669e-05, "loss": 0.0078, "step": 148400 }, { "epoch": 1.6, "learning_rate": 5.934033858727378e-05, "loss": 0.0081, "step": 148410 }, { "epoch": 1.6, "learning_rate": 5.9324122721670875e-05, "loss": 0.0087, "step": 148420 }, { "epoch": 1.6, "learning_rate": 5.930790685606797e-05, "loss": 0.0092, "step": 148430 }, { "epoch": 1.6, "learning_rate": 5.929169099046506e-05, "loss": 0.0074, "step": 148440 }, { "epoch": 1.6, "learning_rate": 5.9275475124862154e-05, "loss": 0.0075, "step": 148450 }, { "epoch": 1.6, "learning_rate": 5.925925925925925e-05, "loss": 0.0068, "step": 148460 }, { "epoch": 1.61, "learning_rate": 5.9243043393656346e-05, "loss": 0.0096, "step": 148470 }, { "epoch": 1.61, "learning_rate": 5.922682752805344e-05, "loss": 0.007, "step": 148480 }, { "epoch": 1.61, "learning_rate": 5.921061166245053e-05, "loss": 0.0085, "step": 148490 }, { "epoch": 1.61, "learning_rate": 5.9194395796847624e-05, "loss": 0.0078, "step": 148500 }, { "epoch": 1.61, "learning_rate": 5.9178179931244724e-05, "loss": 0.0085, "step": 148510 }, { "epoch": 1.61, "learning_rate": 5.9161964065641816e-05, "loss": 0.0067, "step": 148520 }, { "epoch": 1.61, "learning_rate": 5.914574820003891e-05, "loss": 0.0072, "step": 148530 }, { "epoch": 1.61, "learning_rate": 5.912953233443601e-05, "loss": 0.0095, "step": 148540 }, { "epoch": 1.61, "learning_rate": 5.911331646883311e-05, "loss": 0.0083, "step": 148550 }, { "epoch": 1.61, "learning_rate": 5.90971006032302e-05, "loss": 0.0075, "step": 148560 }, { "epoch": 1.61, "learning_rate": 5.9080884737627294e-05, "loss": 0.0081, "step": 148570 }, { "epoch": 1.61, "learning_rate": 5.9064668872024386e-05, "loss": 0.0072, "step": 148580 }, { "epoch": 1.61, "learning_rate": 5.904845300642148e-05, "loss": 0.0102, "step": 148590 }, { "epoch": 1.61, "learning_rate": 5.903223714081857e-05, "loss": 0.0067, "step": 148600 }, { "epoch": 1.61, "learning_rate": 5.901602127521567e-05, "loss": 0.0061, "step": 148610 }, { "epoch": 1.61, "learning_rate": 5.8999805409612764e-05, "loss": 0.0084, "step": 148620 }, { "epoch": 1.61, "learning_rate": 5.898358954400986e-05, "loss": 0.0068, "step": 148630 }, { "epoch": 1.61, "learning_rate": 5.896737367840695e-05, "loss": 0.0094, "step": 148640 }, { "epoch": 1.61, "learning_rate": 5.895115781280404e-05, "loss": 0.0086, "step": 148650 }, { "epoch": 1.61, "learning_rate": 5.893494194720114e-05, "loss": 0.0073, "step": 148660 }, { "epoch": 1.61, "learning_rate": 5.8918726081598235e-05, "loss": 0.006, "step": 148670 }, { "epoch": 1.61, "learning_rate": 5.890251021599533e-05, "loss": 0.0078, "step": 148680 }, { "epoch": 1.61, "learning_rate": 5.888629435039242e-05, "loss": 0.0086, "step": 148690 }, { "epoch": 1.61, "learning_rate": 5.887007848478951e-05, "loss": 0.0087, "step": 148700 }, { "epoch": 1.61, "learning_rate": 5.885386261918661e-05, "loss": 0.0059, "step": 148710 }, { "epoch": 1.61, "learning_rate": 5.8837646753583705e-05, "loss": 0.0068, "step": 148720 }, { "epoch": 1.61, "learning_rate": 5.88214308879808e-05, "loss": 0.0081, "step": 148730 }, { "epoch": 1.61, "learning_rate": 5.880521502237789e-05, "loss": 0.0104, "step": 148740 }, { "epoch": 1.61, "learning_rate": 5.878899915677498e-05, "loss": 0.0075, "step": 148750 }, { "epoch": 1.61, "learning_rate": 5.8772783291172076e-05, "loss": 0.0072, "step": 148760 }, { "epoch": 1.61, "learning_rate": 5.8756567425569176e-05, "loss": 0.0074, "step": 148770 }, { "epoch": 1.61, "learning_rate": 5.874035155996627e-05, "loss": 0.0072, "step": 148780 }, { "epoch": 1.61, "learning_rate": 5.872413569436336e-05, "loss": 0.011, "step": 148790 }, { "epoch": 1.61, "learning_rate": 5.8707919828760454e-05, "loss": 0.0082, "step": 148800 }, { "epoch": 1.61, "learning_rate": 5.8691703963157547e-05, "loss": 0.0068, "step": 148810 }, { "epoch": 1.61, "learning_rate": 5.8675488097554646e-05, "loss": 0.0074, "step": 148820 }, { "epoch": 1.61, "learning_rate": 5.865927223195174e-05, "loss": 0.0056, "step": 148830 }, { "epoch": 1.61, "learning_rate": 5.864305636634883e-05, "loss": 0.0071, "step": 148840 }, { "epoch": 1.61, "learning_rate": 5.8626840500745924e-05, "loss": 0.007, "step": 148850 }, { "epoch": 1.61, "learning_rate": 5.861062463514302e-05, "loss": 0.0075, "step": 148860 }, { "epoch": 1.61, "learning_rate": 5.8594408769540117e-05, "loss": 0.007, "step": 148870 }, { "epoch": 1.61, "learning_rate": 5.857819290393721e-05, "loss": 0.0081, "step": 148880 }, { "epoch": 1.61, "learning_rate": 5.85619770383343e-05, "loss": 0.0063, "step": 148890 }, { "epoch": 1.61, "learning_rate": 5.8545761172731395e-05, "loss": 0.0084, "step": 148900 }, { "epoch": 1.61, "learning_rate": 5.852954530712849e-05, "loss": 0.0053, "step": 148910 }, { "epoch": 1.61, "learning_rate": 5.851332944152558e-05, "loss": 0.0107, "step": 148920 }, { "epoch": 1.61, "learning_rate": 5.849711357592268e-05, "loss": 0.0086, "step": 148930 }, { "epoch": 1.61, "learning_rate": 5.848089771031977e-05, "loss": 0.0074, "step": 148940 }, { "epoch": 1.61, "learning_rate": 5.8464681844716865e-05, "loss": 0.0091, "step": 148950 }, { "epoch": 1.61, "learning_rate": 5.844846597911396e-05, "loss": 0.0066, "step": 148960 }, { "epoch": 1.61, "learning_rate": 5.843225011351105e-05, "loss": 0.0067, "step": 148970 }, { "epoch": 1.61, "learning_rate": 5.841603424790815e-05, "loss": 0.0065, "step": 148980 }, { "epoch": 1.61, "learning_rate": 5.839981838230524e-05, "loss": 0.0067, "step": 148990 }, { "epoch": 1.61, "learning_rate": 5.8383602516702336e-05, "loss": 0.0066, "step": 149000 }, { "epoch": 1.61, "eval_cer": 0.9215234600972488, "eval_loss": 0.006172089837491512, "eval_runtime": 121.2213, "eval_samples_per_second": 16.499, "eval_steps_per_second": 4.125, "step": 149000 }, { "epoch": 1.61, "learning_rate": 5.836738665109943e-05, "loss": 0.009, "step": 149010 }, { "epoch": 1.61, "learning_rate": 5.835117078549652e-05, "loss": 0.0067, "step": 149020 }, { "epoch": 1.61, "learning_rate": 5.8334954919893614e-05, "loss": 0.0061, "step": 149030 }, { "epoch": 1.61, "learning_rate": 5.8318739054290713e-05, "loss": 0.0056, "step": 149040 }, { "epoch": 1.61, "learning_rate": 5.8302523188687806e-05, "loss": 0.0071, "step": 149050 }, { "epoch": 1.61, "learning_rate": 5.82863073230849e-05, "loss": 0.0068, "step": 149060 }, { "epoch": 1.61, "learning_rate": 5.827009145748199e-05, "loss": 0.0075, "step": 149070 }, { "epoch": 1.61, "learning_rate": 5.8253875591879084e-05, "loss": 0.0088, "step": 149080 }, { "epoch": 1.61, "learning_rate": 5.8237659726276184e-05, "loss": 0.007, "step": 149090 }, { "epoch": 1.61, "learning_rate": 5.822144386067328e-05, "loss": 0.0117, "step": 149100 }, { "epoch": 1.61, "learning_rate": 5.820522799507037e-05, "loss": 0.0091, "step": 149110 }, { "epoch": 1.61, "learning_rate": 5.818901212946746e-05, "loss": 0.0083, "step": 149120 }, { "epoch": 1.61, "learning_rate": 5.8172796263864555e-05, "loss": 0.008, "step": 149130 }, { "epoch": 1.61, "learning_rate": 5.8156580398261654e-05, "loss": 0.007, "step": 149140 }, { "epoch": 1.61, "learning_rate": 5.814036453265875e-05, "loss": 0.0096, "step": 149150 }, { "epoch": 1.61, "learning_rate": 5.812414866705584e-05, "loss": 0.0094, "step": 149160 }, { "epoch": 1.61, "learning_rate": 5.810793280145293e-05, "loss": 0.0073, "step": 149170 }, { "epoch": 1.61, "learning_rate": 5.8091716935850025e-05, "loss": 0.0087, "step": 149180 }, { "epoch": 1.61, "learning_rate": 5.807550107024712e-05, "loss": 0.0059, "step": 149190 }, { "epoch": 1.61, "learning_rate": 5.805928520464422e-05, "loss": 0.0071, "step": 149200 }, { "epoch": 1.61, "learning_rate": 5.804306933904131e-05, "loss": 0.0113, "step": 149210 }, { "epoch": 1.61, "learning_rate": 5.80268534734384e-05, "loss": 0.0097, "step": 149220 }, { "epoch": 1.61, "learning_rate": 5.8010637607835496e-05, "loss": 0.0067, "step": 149230 }, { "epoch": 1.61, "learning_rate": 5.799442174223259e-05, "loss": 0.0089, "step": 149240 }, { "epoch": 1.61, "learning_rate": 5.797820587662969e-05, "loss": 0.006, "step": 149250 }, { "epoch": 1.61, "learning_rate": 5.796199001102679e-05, "loss": 0.0105, "step": 149260 }, { "epoch": 1.61, "learning_rate": 5.794577414542388e-05, "loss": 0.0062, "step": 149270 }, { "epoch": 1.61, "learning_rate": 5.792955827982097e-05, "loss": 0.0071, "step": 149280 }, { "epoch": 1.61, "learning_rate": 5.791334241421807e-05, "loss": 0.0061, "step": 149290 }, { "epoch": 1.61, "learning_rate": 5.7897126548615165e-05, "loss": 0.0066, "step": 149300 }, { "epoch": 1.61, "learning_rate": 5.788091068301226e-05, "loss": 0.0091, "step": 149310 }, { "epoch": 1.61, "learning_rate": 5.786469481740935e-05, "loss": 0.0074, "step": 149320 }, { "epoch": 1.61, "learning_rate": 5.7848478951806444e-05, "loss": 0.0094, "step": 149330 }, { "epoch": 1.61, "learning_rate": 5.7832263086203536e-05, "loss": 0.0086, "step": 149340 }, { "epoch": 1.61, "learning_rate": 5.7816047220600636e-05, "loss": 0.0063, "step": 149350 }, { "epoch": 1.61, "learning_rate": 5.779983135499773e-05, "loss": 0.0085, "step": 149360 }, { "epoch": 1.61, "learning_rate": 5.778361548939482e-05, "loss": 0.0089, "step": 149370 }, { "epoch": 1.61, "learning_rate": 5.7767399623791914e-05, "loss": 0.0075, "step": 149380 }, { "epoch": 1.61, "learning_rate": 5.775118375818901e-05, "loss": 0.0045, "step": 149390 }, { "epoch": 1.62, "learning_rate": 5.7734967892586106e-05, "loss": 0.0076, "step": 149400 }, { "epoch": 1.62, "learning_rate": 5.77187520269832e-05, "loss": 0.0073, "step": 149410 }, { "epoch": 1.62, "learning_rate": 5.770253616138029e-05, "loss": 0.006, "step": 149420 }, { "epoch": 1.62, "learning_rate": 5.7686320295777385e-05, "loss": 0.0063, "step": 149430 }, { "epoch": 1.62, "learning_rate": 5.767010443017448e-05, "loss": 0.0085, "step": 149440 }, { "epoch": 1.62, "learning_rate": 5.765388856457158e-05, "loss": 0.0078, "step": 149450 }, { "epoch": 1.62, "learning_rate": 5.763767269896867e-05, "loss": 0.0068, "step": 149460 }, { "epoch": 1.62, "learning_rate": 5.762145683336576e-05, "loss": 0.0071, "step": 149470 }, { "epoch": 1.62, "learning_rate": 5.7605240967762855e-05, "loss": 0.0097, "step": 149480 }, { "epoch": 1.62, "learning_rate": 5.758902510215995e-05, "loss": 0.0061, "step": 149490 }, { "epoch": 1.62, "learning_rate": 5.757280923655704e-05, "loss": 0.0058, "step": 149500 }, { "epoch": 1.62, "learning_rate": 5.755659337095414e-05, "loss": 0.0089, "step": 149510 }, { "epoch": 1.62, "learning_rate": 5.754037750535123e-05, "loss": 0.0079, "step": 149520 }, { "epoch": 1.62, "learning_rate": 5.7524161639748326e-05, "loss": 0.007, "step": 149530 }, { "epoch": 1.62, "learning_rate": 5.750794577414542e-05, "loss": 0.0067, "step": 149540 }, { "epoch": 1.62, "learning_rate": 5.749172990854251e-05, "loss": 0.0085, "step": 149550 }, { "epoch": 1.62, "learning_rate": 5.747551404293961e-05, "loss": 0.0078, "step": 149560 }, { "epoch": 1.62, "learning_rate": 5.7459298177336703e-05, "loss": 0.0073, "step": 149570 }, { "epoch": 1.62, "learning_rate": 5.7443082311733796e-05, "loss": 0.0063, "step": 149580 }, { "epoch": 1.62, "learning_rate": 5.742686644613089e-05, "loss": 0.0106, "step": 149590 }, { "epoch": 1.62, "learning_rate": 5.741065058052798e-05, "loss": 0.0071, "step": 149600 }, { "epoch": 1.62, "learning_rate": 5.7394434714925074e-05, "loss": 0.0073, "step": 149610 }, { "epoch": 1.62, "learning_rate": 5.7378218849322174e-05, "loss": 0.0095, "step": 149620 }, { "epoch": 1.62, "learning_rate": 5.736200298371927e-05, "loss": 0.0071, "step": 149630 }, { "epoch": 1.62, "learning_rate": 5.734578711811636e-05, "loss": 0.0097, "step": 149640 }, { "epoch": 1.62, "learning_rate": 5.732957125251345e-05, "loss": 0.011, "step": 149650 }, { "epoch": 1.62, "learning_rate": 5.7313355386910545e-05, "loss": 0.0098, "step": 149660 }, { "epoch": 1.62, "learning_rate": 5.7297139521307644e-05, "loss": 0.0068, "step": 149670 }, { "epoch": 1.62, "learning_rate": 5.728092365570474e-05, "loss": 0.0067, "step": 149680 }, { "epoch": 1.62, "learning_rate": 5.726470779010183e-05, "loss": 0.0091, "step": 149690 }, { "epoch": 1.62, "learning_rate": 5.724849192449892e-05, "loss": 0.0108, "step": 149700 }, { "epoch": 1.62, "learning_rate": 5.7232276058896015e-05, "loss": 0.0108, "step": 149710 }, { "epoch": 1.62, "learning_rate": 5.7216060193293115e-05, "loss": 0.0076, "step": 149720 }, { "epoch": 1.62, "learning_rate": 5.719984432769021e-05, "loss": 0.0059, "step": 149730 }, { "epoch": 1.62, "learning_rate": 5.71836284620873e-05, "loss": 0.0084, "step": 149740 }, { "epoch": 1.62, "learning_rate": 5.716741259648439e-05, "loss": 0.007, "step": 149750 }, { "epoch": 1.62, "learning_rate": 5.7151196730881486e-05, "loss": 0.008, "step": 149760 }, { "epoch": 1.62, "learning_rate": 5.713498086527858e-05, "loss": 0.0064, "step": 149770 }, { "epoch": 1.62, "learning_rate": 5.711876499967568e-05, "loss": 0.0067, "step": 149780 }, { "epoch": 1.62, "learning_rate": 5.710254913407277e-05, "loss": 0.0089, "step": 149790 }, { "epoch": 1.62, "learning_rate": 5.7086333268469864e-05, "loss": 0.0071, "step": 149800 }, { "epoch": 1.62, "learning_rate": 5.7070117402866956e-05, "loss": 0.0069, "step": 149810 }, { "epoch": 1.62, "learning_rate": 5.705390153726405e-05, "loss": 0.0087, "step": 149820 }, { "epoch": 1.62, "learning_rate": 5.703768567166115e-05, "loss": 0.0079, "step": 149830 }, { "epoch": 1.62, "learning_rate": 5.702146980605824e-05, "loss": 0.009, "step": 149840 }, { "epoch": 1.62, "learning_rate": 5.7005253940455334e-05, "loss": 0.0075, "step": 149850 }, { "epoch": 1.62, "learning_rate": 5.698903807485243e-05, "loss": 0.0125, "step": 149860 }, { "epoch": 1.62, "learning_rate": 5.697282220924952e-05, "loss": 0.0078, "step": 149870 }, { "epoch": 1.62, "learning_rate": 5.695660634364662e-05, "loss": 0.009, "step": 149880 }, { "epoch": 1.62, "learning_rate": 5.694039047804371e-05, "loss": 0.0087, "step": 149890 }, { "epoch": 1.62, "learning_rate": 5.6924174612440805e-05, "loss": 0.009, "step": 149900 }, { "epoch": 1.62, "learning_rate": 5.69079587468379e-05, "loss": 0.0067, "step": 149910 }, { "epoch": 1.62, "learning_rate": 5.689174288123499e-05, "loss": 0.0091, "step": 149920 }, { "epoch": 1.62, "learning_rate": 5.687552701563208e-05, "loss": 0.007, "step": 149930 }, { "epoch": 1.62, "learning_rate": 5.685931115002918e-05, "loss": 0.0075, "step": 149940 }, { "epoch": 1.62, "learning_rate": 5.6843095284426275e-05, "loss": 0.0065, "step": 149950 }, { "epoch": 1.62, "learning_rate": 5.682687941882337e-05, "loss": 0.0093, "step": 149960 }, { "epoch": 1.62, "learning_rate": 5.681066355322046e-05, "loss": 0.0063, "step": 149970 }, { "epoch": 1.62, "learning_rate": 5.679444768761757e-05, "loss": 0.0077, "step": 149980 }, { "epoch": 1.62, "learning_rate": 5.677823182201466e-05, "loss": 0.0087, "step": 149990 }, { "epoch": 1.62, "learning_rate": 5.676201595641175e-05, "loss": 0.0087, "step": 150000 }, { "epoch": 1.62, "eval_cer": 0.9215086938469904, "eval_loss": 0.006060704588890076, "eval_runtime": 121.178, "eval_samples_per_second": 16.505, "eval_steps_per_second": 4.126, "step": 150000 }, { "epoch": 1.62, "learning_rate": 5.6745800090808845e-05, "loss": 0.0092, "step": 150010 }, { "epoch": 1.62, "learning_rate": 5.672958422520594e-05, "loss": 0.0085, "step": 150020 }, { "epoch": 1.62, "learning_rate": 5.671336835960304e-05, "loss": 0.0049, "step": 150030 }, { "epoch": 1.62, "learning_rate": 5.669715249400013e-05, "loss": 0.0063, "step": 150040 }, { "epoch": 1.62, "learning_rate": 5.668093662839722e-05, "loss": 0.0065, "step": 150050 }, { "epoch": 1.62, "learning_rate": 5.6664720762794316e-05, "loss": 0.007, "step": 150060 }, { "epoch": 1.62, "learning_rate": 5.664850489719141e-05, "loss": 0.0073, "step": 150070 }, { "epoch": 1.62, "learning_rate": 5.66322890315885e-05, "loss": 0.0064, "step": 150080 }, { "epoch": 1.62, "learning_rate": 5.66160731659856e-05, "loss": 0.0066, "step": 150090 }, { "epoch": 1.62, "learning_rate": 5.659985730038269e-05, "loss": 0.0073, "step": 150100 }, { "epoch": 1.62, "learning_rate": 5.6583641434779786e-05, "loss": 0.0062, "step": 150110 }, { "epoch": 1.62, "learning_rate": 5.656742556917688e-05, "loss": 0.0077, "step": 150120 }, { "epoch": 1.62, "learning_rate": 5.655120970357397e-05, "loss": 0.0064, "step": 150130 }, { "epoch": 1.62, "learning_rate": 5.653499383797107e-05, "loss": 0.0062, "step": 150140 }, { "epoch": 1.62, "learning_rate": 5.6518777972368164e-05, "loss": 0.008, "step": 150150 }, { "epoch": 1.62, "learning_rate": 5.650256210676526e-05, "loss": 0.0066, "step": 150160 }, { "epoch": 1.62, "learning_rate": 5.648634624116235e-05, "loss": 0.0085, "step": 150170 }, { "epoch": 1.62, "learning_rate": 5.647013037555944e-05, "loss": 0.0114, "step": 150180 }, { "epoch": 1.62, "learning_rate": 5.6453914509956535e-05, "loss": 0.0087, "step": 150190 }, { "epoch": 1.62, "learning_rate": 5.6437698644353634e-05, "loss": 0.0072, "step": 150200 }, { "epoch": 1.62, "learning_rate": 5.642148277875073e-05, "loss": 0.0116, "step": 150210 }, { "epoch": 1.62, "learning_rate": 5.640526691314782e-05, "loss": 0.0077, "step": 150220 }, { "epoch": 1.62, "learning_rate": 5.638905104754491e-05, "loss": 0.0082, "step": 150230 }, { "epoch": 1.62, "learning_rate": 5.6372835181942005e-05, "loss": 0.0072, "step": 150240 }, { "epoch": 1.62, "learning_rate": 5.6356619316339105e-05, "loss": 0.0075, "step": 150250 }, { "epoch": 1.62, "learning_rate": 5.63404034507362e-05, "loss": 0.0059, "step": 150260 }, { "epoch": 1.62, "learning_rate": 5.632418758513329e-05, "loss": 0.0075, "step": 150270 }, { "epoch": 1.62, "learning_rate": 5.630797171953038e-05, "loss": 0.0086, "step": 150280 }, { "epoch": 1.62, "learning_rate": 5.6291755853927476e-05, "loss": 0.0073, "step": 150290 }, { "epoch": 1.62, "learning_rate": 5.6275539988324575e-05, "loss": 0.0088, "step": 150300 }, { "epoch": 1.62, "learning_rate": 5.625932412272167e-05, "loss": 0.0062, "step": 150310 }, { "epoch": 1.63, "learning_rate": 5.624310825711876e-05, "loss": 0.0075, "step": 150320 }, { "epoch": 1.63, "learning_rate": 5.6226892391515854e-05, "loss": 0.0063, "step": 150330 }, { "epoch": 1.63, "learning_rate": 5.6210676525912946e-05, "loss": 0.0071, "step": 150340 }, { "epoch": 1.63, "learning_rate": 5.619446066031004e-05, "loss": 0.0085, "step": 150350 }, { "epoch": 1.63, "learning_rate": 5.617824479470714e-05, "loss": 0.0066, "step": 150360 }, { "epoch": 1.63, "learning_rate": 5.616202892910423e-05, "loss": 0.0091, "step": 150370 }, { "epoch": 1.63, "learning_rate": 5.6145813063501324e-05, "loss": 0.006, "step": 150380 }, { "epoch": 1.63, "learning_rate": 5.612959719789842e-05, "loss": 0.0082, "step": 150390 }, { "epoch": 1.63, "learning_rate": 5.611338133229551e-05, "loss": 0.0086, "step": 150400 }, { "epoch": 1.63, "learning_rate": 5.609716546669261e-05, "loss": 0.0063, "step": 150410 }, { "epoch": 1.63, "learning_rate": 5.60809496010897e-05, "loss": 0.0079, "step": 150420 }, { "epoch": 1.63, "learning_rate": 5.6064733735486795e-05, "loss": 0.0084, "step": 150430 }, { "epoch": 1.63, "learning_rate": 5.604851786988389e-05, "loss": 0.0067, "step": 150440 }, { "epoch": 1.63, "learning_rate": 5.603230200428098e-05, "loss": 0.0065, "step": 150450 }, { "epoch": 1.63, "learning_rate": 5.601608613867808e-05, "loss": 0.0052, "step": 150460 }, { "epoch": 1.63, "learning_rate": 5.599987027307517e-05, "loss": 0.0061, "step": 150470 }, { "epoch": 1.63, "learning_rate": 5.5983654407472265e-05, "loss": 0.0088, "step": 150480 }, { "epoch": 1.63, "learning_rate": 5.596743854186936e-05, "loss": 0.0073, "step": 150490 }, { "epoch": 1.63, "learning_rate": 5.595122267626645e-05, "loss": 0.0075, "step": 150500 }, { "epoch": 1.63, "learning_rate": 5.593500681066354e-05, "loss": 0.0073, "step": 150510 }, { "epoch": 1.63, "learning_rate": 5.591879094506064e-05, "loss": 0.0087, "step": 150520 }, { "epoch": 1.63, "learning_rate": 5.5902575079457736e-05, "loss": 0.0064, "step": 150530 }, { "epoch": 1.63, "learning_rate": 5.588635921385483e-05, "loss": 0.0081, "step": 150540 }, { "epoch": 1.63, "learning_rate": 5.587014334825192e-05, "loss": 0.0088, "step": 150550 }, { "epoch": 1.63, "learning_rate": 5.5853927482649014e-05, "loss": 0.0076, "step": 150560 }, { "epoch": 1.63, "learning_rate": 5.583771161704611e-05, "loss": 0.0065, "step": 150570 }, { "epoch": 1.63, "learning_rate": 5.5821495751443206e-05, "loss": 0.0079, "step": 150580 }, { "epoch": 1.63, "learning_rate": 5.58052798858403e-05, "loss": 0.0087, "step": 150590 }, { "epoch": 1.63, "learning_rate": 5.578906402023739e-05, "loss": 0.0092, "step": 150600 }, { "epoch": 1.63, "learning_rate": 5.5772848154634484e-05, "loss": 0.0081, "step": 150610 }, { "epoch": 1.63, "learning_rate": 5.575663228903158e-05, "loss": 0.0045, "step": 150620 }, { "epoch": 1.63, "learning_rate": 5.5740416423428677e-05, "loss": 0.0064, "step": 150630 }, { "epoch": 1.63, "learning_rate": 5.572420055782577e-05, "loss": 0.0107, "step": 150640 }, { "epoch": 1.63, "learning_rate": 5.570798469222286e-05, "loss": 0.008, "step": 150650 }, { "epoch": 1.63, "learning_rate": 5.5691768826619955e-05, "loss": 0.0087, "step": 150660 }, { "epoch": 1.63, "learning_rate": 5.567555296101705e-05, "loss": 0.0075, "step": 150670 }, { "epoch": 1.63, "learning_rate": 5.565933709541415e-05, "loss": 0.0078, "step": 150680 }, { "epoch": 1.63, "learning_rate": 5.564312122981124e-05, "loss": 0.0092, "step": 150690 }, { "epoch": 1.63, "learning_rate": 5.562690536420834e-05, "loss": 0.0088, "step": 150700 }, { "epoch": 1.63, "learning_rate": 5.561068949860543e-05, "loss": 0.007, "step": 150710 }, { "epoch": 1.63, "learning_rate": 5.559447363300253e-05, "loss": 0.0072, "step": 150720 }, { "epoch": 1.63, "learning_rate": 5.5578257767399624e-05, "loss": 0.0074, "step": 150730 }, { "epoch": 1.63, "learning_rate": 5.556204190179672e-05, "loss": 0.0078, "step": 150740 }, { "epoch": 1.63, "learning_rate": 5.554582603619381e-05, "loss": 0.007, "step": 150750 }, { "epoch": 1.63, "learning_rate": 5.55296101705909e-05, "loss": 0.0125, "step": 150760 }, { "epoch": 1.63, "learning_rate": 5.5513394304987995e-05, "loss": 0.0087, "step": 150770 }, { "epoch": 1.63, "learning_rate": 5.5497178439385095e-05, "loss": 0.0085, "step": 150780 }, { "epoch": 1.63, "learning_rate": 5.548096257378219e-05, "loss": 0.0073, "step": 150790 }, { "epoch": 1.63, "learning_rate": 5.546474670817928e-05, "loss": 0.0067, "step": 150800 }, { "epoch": 1.63, "learning_rate": 5.544853084257637e-05, "loss": 0.0062, "step": 150810 }, { "epoch": 1.63, "learning_rate": 5.5432314976973466e-05, "loss": 0.0097, "step": 150820 }, { "epoch": 1.63, "learning_rate": 5.5416099111370565e-05, "loss": 0.0052, "step": 150830 }, { "epoch": 1.63, "learning_rate": 5.539988324576766e-05, "loss": 0.007, "step": 150840 }, { "epoch": 1.63, "learning_rate": 5.538366738016475e-05, "loss": 0.0067, "step": 150850 }, { "epoch": 1.63, "learning_rate": 5.5367451514561844e-05, "loss": 0.0066, "step": 150860 }, { "epoch": 1.63, "learning_rate": 5.5351235648958936e-05, "loss": 0.0063, "step": 150870 }, { "epoch": 1.63, "learning_rate": 5.5335019783356036e-05, "loss": 0.0063, "step": 150880 }, { "epoch": 1.63, "learning_rate": 5.531880391775313e-05, "loss": 0.0056, "step": 150890 }, { "epoch": 1.63, "learning_rate": 5.530258805215022e-05, "loss": 0.0091, "step": 150900 }, { "epoch": 1.63, "learning_rate": 5.5286372186547314e-05, "loss": 0.0078, "step": 150910 }, { "epoch": 1.63, "learning_rate": 5.527015632094441e-05, "loss": 0.007, "step": 150920 }, { "epoch": 1.63, "learning_rate": 5.52539404553415e-05, "loss": 0.0084, "step": 150930 }, { "epoch": 1.63, "learning_rate": 5.52377245897386e-05, "loss": 0.0071, "step": 150940 }, { "epoch": 1.63, "learning_rate": 5.522150872413569e-05, "loss": 0.0075, "step": 150950 }, { "epoch": 1.63, "learning_rate": 5.5205292858532785e-05, "loss": 0.0061, "step": 150960 }, { "epoch": 1.63, "learning_rate": 5.518907699292988e-05, "loss": 0.0087, "step": 150970 }, { "epoch": 1.63, "learning_rate": 5.517286112732697e-05, "loss": 0.0076, "step": 150980 }, { "epoch": 1.63, "learning_rate": 5.515664526172407e-05, "loss": 0.0071, "step": 150990 }, { "epoch": 1.63, "learning_rate": 5.514042939612116e-05, "loss": 0.0059, "step": 151000 }, { "epoch": 1.63, "eval_cer": 0.9215286717149871, "eval_loss": 0.0059387171640992165, "eval_runtime": 121.2054, "eval_samples_per_second": 16.501, "eval_steps_per_second": 4.125, "step": 151000 }, { "epoch": 1.63, "learning_rate": 5.5124213530518255e-05, "loss": 0.0106, "step": 151010 }, { "epoch": 1.63, "learning_rate": 5.510799766491535e-05, "loss": 0.0064, "step": 151020 }, { "epoch": 1.63, "learning_rate": 5.509178179931244e-05, "loss": 0.0057, "step": 151030 }, { "epoch": 1.63, "learning_rate": 5.507556593370954e-05, "loss": 0.0071, "step": 151040 }, { "epoch": 1.63, "learning_rate": 5.505935006810663e-05, "loss": 0.008, "step": 151050 }, { "epoch": 1.63, "learning_rate": 5.5043134202503726e-05, "loss": 0.0069, "step": 151060 }, { "epoch": 1.63, "learning_rate": 5.502691833690082e-05, "loss": 0.009, "step": 151070 }, { "epoch": 1.63, "learning_rate": 5.501070247129791e-05, "loss": 0.0056, "step": 151080 }, { "epoch": 1.63, "learning_rate": 5.4994486605695004e-05, "loss": 0.0074, "step": 151090 }, { "epoch": 1.63, "learning_rate": 5.49782707400921e-05, "loss": 0.0077, "step": 151100 }, { "epoch": 1.63, "learning_rate": 5.4962054874489196e-05, "loss": 0.0063, "step": 151110 }, { "epoch": 1.63, "learning_rate": 5.494583900888629e-05, "loss": 0.0086, "step": 151120 }, { "epoch": 1.63, "learning_rate": 5.492962314328338e-05, "loss": 0.0069, "step": 151130 }, { "epoch": 1.63, "learning_rate": 5.4913407277680474e-05, "loss": 0.0096, "step": 151140 }, { "epoch": 1.63, "learning_rate": 5.4897191412077574e-05, "loss": 0.0069, "step": 151150 }, { "epoch": 1.63, "learning_rate": 5.4880975546474666e-05, "loss": 0.0076, "step": 151160 }, { "epoch": 1.63, "learning_rate": 5.486475968087176e-05, "loss": 0.0058, "step": 151170 }, { "epoch": 1.63, "learning_rate": 5.484854381526885e-05, "loss": 0.006, "step": 151180 }, { "epoch": 1.63, "learning_rate": 5.4832327949665945e-05, "loss": 0.0061, "step": 151190 }, { "epoch": 1.63, "learning_rate": 5.481611208406304e-05, "loss": 0.0073, "step": 151200 }, { "epoch": 1.63, "learning_rate": 5.479989621846014e-05, "loss": 0.0067, "step": 151210 }, { "epoch": 1.63, "learning_rate": 5.478368035285723e-05, "loss": 0.0078, "step": 151220 }, { "epoch": 1.63, "learning_rate": 5.476746448725432e-05, "loss": 0.0086, "step": 151230 }, { "epoch": 1.63, "learning_rate": 5.4751248621651415e-05, "loss": 0.0082, "step": 151240 }, { "epoch": 1.64, "learning_rate": 5.473503275604851e-05, "loss": 0.0064, "step": 151250 }, { "epoch": 1.64, "learning_rate": 5.471881689044561e-05, "loss": 0.0073, "step": 151260 }, { "epoch": 1.64, "learning_rate": 5.47026010248427e-05, "loss": 0.0119, "step": 151270 }, { "epoch": 1.64, "learning_rate": 5.468638515923979e-05, "loss": 0.0077, "step": 151280 }, { "epoch": 1.64, "learning_rate": 5.4670169293636886e-05, "loss": 0.0097, "step": 151290 }, { "epoch": 1.64, "learning_rate": 5.465395342803398e-05, "loss": 0.0085, "step": 151300 }, { "epoch": 1.64, "learning_rate": 5.463773756243108e-05, "loss": 0.0055, "step": 151310 }, { "epoch": 1.64, "learning_rate": 5.462152169682817e-05, "loss": 0.0069, "step": 151320 }, { "epoch": 1.64, "learning_rate": 5.4605305831225263e-05, "loss": 0.0082, "step": 151330 }, { "epoch": 1.64, "learning_rate": 5.4589089965622356e-05, "loss": 0.0088, "step": 151340 }, { "epoch": 1.64, "learning_rate": 5.457287410001945e-05, "loss": 0.0058, "step": 151350 }, { "epoch": 1.64, "learning_rate": 5.455665823441654e-05, "loss": 0.0071, "step": 151360 }, { "epoch": 1.64, "learning_rate": 5.454044236881364e-05, "loss": 0.0104, "step": 151370 }, { "epoch": 1.64, "learning_rate": 5.4524226503210734e-05, "loss": 0.0083, "step": 151380 }, { "epoch": 1.64, "learning_rate": 5.450801063760783e-05, "loss": 0.008, "step": 151390 }, { "epoch": 1.64, "learning_rate": 5.449179477200492e-05, "loss": 0.0072, "step": 151400 }, { "epoch": 1.64, "learning_rate": 5.447557890640201e-05, "loss": 0.0073, "step": 151410 }, { "epoch": 1.64, "learning_rate": 5.445936304079912e-05, "loss": 0.0084, "step": 151420 }, { "epoch": 1.64, "learning_rate": 5.444314717519621e-05, "loss": 0.0089, "step": 151430 }, { "epoch": 1.64, "learning_rate": 5.4426931309593304e-05, "loss": 0.0074, "step": 151440 }, { "epoch": 1.64, "learning_rate": 5.44107154439904e-05, "loss": 0.0065, "step": 151450 }, { "epoch": 1.64, "learning_rate": 5.4394499578387496e-05, "loss": 0.0068, "step": 151460 }, { "epoch": 1.64, "learning_rate": 5.437828371278459e-05, "loss": 0.0067, "step": 151470 }, { "epoch": 1.64, "learning_rate": 5.436206784718168e-05, "loss": 0.0086, "step": 151480 }, { "epoch": 1.64, "learning_rate": 5.4345851981578774e-05, "loss": 0.0049, "step": 151490 }, { "epoch": 1.64, "learning_rate": 5.432963611597587e-05, "loss": 0.0054, "step": 151500 }, { "epoch": 1.64, "learning_rate": 5.431342025037296e-05, "loss": 0.0059, "step": 151510 }, { "epoch": 1.64, "learning_rate": 5.429720438477006e-05, "loss": 0.008, "step": 151520 }, { "epoch": 1.64, "learning_rate": 5.428098851916715e-05, "loss": 0.0063, "step": 151530 }, { "epoch": 1.64, "learning_rate": 5.4264772653564245e-05, "loss": 0.0051, "step": 151540 }, { "epoch": 1.64, "learning_rate": 5.424855678796134e-05, "loss": 0.007, "step": 151550 }, { "epoch": 1.64, "learning_rate": 5.423234092235843e-05, "loss": 0.0082, "step": 151560 }, { "epoch": 1.64, "learning_rate": 5.421612505675553e-05, "loss": 0.0061, "step": 151570 }, { "epoch": 1.64, "learning_rate": 5.419990919115262e-05, "loss": 0.0075, "step": 151580 }, { "epoch": 1.64, "learning_rate": 5.4183693325549715e-05, "loss": 0.0074, "step": 151590 }, { "epoch": 1.64, "learning_rate": 5.416747745994681e-05, "loss": 0.0041, "step": 151600 }, { "epoch": 1.64, "learning_rate": 5.41512615943439e-05, "loss": 0.0083, "step": 151610 }, { "epoch": 1.64, "learning_rate": 5.4135045728741e-05, "loss": 0.0075, "step": 151620 }, { "epoch": 1.64, "learning_rate": 5.411882986313809e-05, "loss": 0.0078, "step": 151630 }, { "epoch": 1.64, "learning_rate": 5.4102613997535186e-05, "loss": 0.0072, "step": 151640 }, { "epoch": 1.64, "learning_rate": 5.408639813193228e-05, "loss": 0.0081, "step": 151650 }, { "epoch": 1.64, "learning_rate": 5.407018226632937e-05, "loss": 0.0064, "step": 151660 }, { "epoch": 1.64, "learning_rate": 5.4053966400726464e-05, "loss": 0.0077, "step": 151670 }, { "epoch": 1.64, "learning_rate": 5.4037750535123564e-05, "loss": 0.0096, "step": 151680 }, { "epoch": 1.64, "learning_rate": 5.4021534669520656e-05, "loss": 0.0068, "step": 151690 }, { "epoch": 1.64, "learning_rate": 5.400531880391775e-05, "loss": 0.0081, "step": 151700 }, { "epoch": 1.64, "learning_rate": 5.398910293831484e-05, "loss": 0.0089, "step": 151710 }, { "epoch": 1.64, "learning_rate": 5.3972887072711935e-05, "loss": 0.0078, "step": 151720 }, { "epoch": 1.64, "learning_rate": 5.3956671207109034e-05, "loss": 0.0062, "step": 151730 }, { "epoch": 1.64, "learning_rate": 5.394045534150613e-05, "loss": 0.0056, "step": 151740 }, { "epoch": 1.64, "learning_rate": 5.392423947590322e-05, "loss": 0.0064, "step": 151750 }, { "epoch": 1.64, "learning_rate": 5.390802361030031e-05, "loss": 0.0074, "step": 151760 }, { "epoch": 1.64, "learning_rate": 5.3891807744697405e-05, "loss": 0.0091, "step": 151770 }, { "epoch": 1.64, "learning_rate": 5.38755918790945e-05, "loss": 0.009, "step": 151780 }, { "epoch": 1.64, "learning_rate": 5.38593760134916e-05, "loss": 0.0081, "step": 151790 }, { "epoch": 1.64, "learning_rate": 5.384316014788869e-05, "loss": 0.0078, "step": 151800 }, { "epoch": 1.64, "learning_rate": 5.382694428228578e-05, "loss": 0.0077, "step": 151810 }, { "epoch": 1.64, "learning_rate": 5.3810728416682876e-05, "loss": 0.0064, "step": 151820 }, { "epoch": 1.64, "learning_rate": 5.379451255107997e-05, "loss": 0.008, "step": 151830 }, { "epoch": 1.64, "learning_rate": 5.377829668547707e-05, "loss": 0.0066, "step": 151840 }, { "epoch": 1.64, "learning_rate": 5.376208081987416e-05, "loss": 0.006, "step": 151850 }, { "epoch": 1.64, "learning_rate": 5.3745864954271253e-05, "loss": 0.0121, "step": 151860 }, { "epoch": 1.64, "learning_rate": 5.3729649088668346e-05, "loss": 0.0094, "step": 151870 }, { "epoch": 1.64, "learning_rate": 5.371343322306544e-05, "loss": 0.0081, "step": 151880 }, { "epoch": 1.64, "learning_rate": 5.369721735746254e-05, "loss": 0.0083, "step": 151890 }, { "epoch": 1.64, "learning_rate": 5.368100149185963e-05, "loss": 0.0061, "step": 151900 }, { "epoch": 1.64, "learning_rate": 5.3664785626256724e-05, "loss": 0.0061, "step": 151910 }, { "epoch": 1.64, "learning_rate": 5.364856976065382e-05, "loss": 0.0069, "step": 151920 }, { "epoch": 1.64, "learning_rate": 5.363235389505091e-05, "loss": 0.0063, "step": 151930 }, { "epoch": 1.64, "learning_rate": 5.3616138029448e-05, "loss": 0.0066, "step": 151940 }, { "epoch": 1.64, "learning_rate": 5.35999221638451e-05, "loss": 0.0083, "step": 151950 }, { "epoch": 1.64, "learning_rate": 5.3583706298242194e-05, "loss": 0.0065, "step": 151960 }, { "epoch": 1.64, "learning_rate": 5.356749043263929e-05, "loss": 0.0104, "step": 151970 }, { "epoch": 1.64, "learning_rate": 5.355127456703638e-05, "loss": 0.008, "step": 151980 }, { "epoch": 1.64, "learning_rate": 5.353505870143347e-05, "loss": 0.0068, "step": 151990 }, { "epoch": 1.64, "learning_rate": 5.351884283583057e-05, "loss": 0.0086, "step": 152000 }, { "epoch": 1.64, "eval_cer": 0.9215173798765541, "eval_loss": 0.005879946518689394, "eval_runtime": 121.1735, "eval_samples_per_second": 16.505, "eval_steps_per_second": 4.126, "step": 152000 }, { "epoch": 1.64, "learning_rate": 5.3502626970227665e-05, "loss": 0.0068, "step": 152010 }, { "epoch": 1.64, "learning_rate": 5.348641110462476e-05, "loss": 0.0074, "step": 152020 }, { "epoch": 1.64, "learning_rate": 5.347019523902185e-05, "loss": 0.0079, "step": 152030 }, { "epoch": 1.64, "learning_rate": 5.345397937341894e-05, "loss": 0.0062, "step": 152040 }, { "epoch": 1.64, "learning_rate": 5.343776350781604e-05, "loss": 0.0071, "step": 152050 }, { "epoch": 1.64, "learning_rate": 5.3421547642213135e-05, "loss": 0.0062, "step": 152060 }, { "epoch": 1.64, "learning_rate": 5.340533177661023e-05, "loss": 0.008, "step": 152070 }, { "epoch": 1.64, "learning_rate": 5.338911591100732e-05, "loss": 0.0068, "step": 152080 }, { "epoch": 1.64, "learning_rate": 5.3372900045404414e-05, "loss": 0.0074, "step": 152090 }, { "epoch": 1.64, "learning_rate": 5.3356684179801506e-05, "loss": 0.0086, "step": 152100 }, { "epoch": 1.64, "learning_rate": 5.3340468314198606e-05, "loss": 0.0063, "step": 152110 }, { "epoch": 1.64, "learning_rate": 5.33242524485957e-05, "loss": 0.0057, "step": 152120 }, { "epoch": 1.64, "learning_rate": 5.330803658299279e-05, "loss": 0.0068, "step": 152130 }, { "epoch": 1.64, "learning_rate": 5.329182071738989e-05, "loss": 0.0087, "step": 152140 }, { "epoch": 1.64, "learning_rate": 5.327560485178699e-05, "loss": 0.0081, "step": 152150 }, { "epoch": 1.64, "learning_rate": 5.325938898618408e-05, "loss": 0.0066, "step": 152160 }, { "epoch": 1.65, "learning_rate": 5.3243173120581176e-05, "loss": 0.0057, "step": 152170 }, { "epoch": 1.65, "learning_rate": 5.322695725497827e-05, "loss": 0.0066, "step": 152180 }, { "epoch": 1.65, "learning_rate": 5.321074138937536e-05, "loss": 0.0062, "step": 152190 }, { "epoch": 1.65, "learning_rate": 5.319452552377246e-05, "loss": 0.0095, "step": 152200 }, { "epoch": 1.65, "learning_rate": 5.3178309658169554e-05, "loss": 0.0081, "step": 152210 }, { "epoch": 1.65, "learning_rate": 5.3162093792566646e-05, "loss": 0.0059, "step": 152220 }, { "epoch": 1.65, "learning_rate": 5.314587792696374e-05, "loss": 0.0058, "step": 152230 }, { "epoch": 1.65, "learning_rate": 5.312966206136083e-05, "loss": 0.007, "step": 152240 }, { "epoch": 1.65, "learning_rate": 5.3113446195757925e-05, "loss": 0.009, "step": 152250 }, { "epoch": 1.65, "learning_rate": 5.3097230330155024e-05, "loss": 0.0074, "step": 152260 }, { "epoch": 1.65, "learning_rate": 5.308101446455212e-05, "loss": 0.0055, "step": 152270 }, { "epoch": 1.65, "learning_rate": 5.306479859894921e-05, "loss": 0.0062, "step": 152280 }, { "epoch": 1.65, "learning_rate": 5.30485827333463e-05, "loss": 0.0088, "step": 152290 }, { "epoch": 1.65, "learning_rate": 5.3032366867743395e-05, "loss": 0.0083, "step": 152300 }, { "epoch": 1.65, "learning_rate": 5.3016151002140495e-05, "loss": 0.0086, "step": 152310 }, { "epoch": 1.65, "learning_rate": 5.299993513653759e-05, "loss": 0.0063, "step": 152320 }, { "epoch": 1.65, "learning_rate": 5.298371927093468e-05, "loss": 0.007, "step": 152330 }, { "epoch": 1.65, "learning_rate": 5.296750340533177e-05, "loss": 0.0104, "step": 152340 }, { "epoch": 1.65, "learning_rate": 5.2951287539728866e-05, "loss": 0.0096, "step": 152350 }, { "epoch": 1.65, "learning_rate": 5.2935071674125965e-05, "loss": 0.0083, "step": 152360 }, { "epoch": 1.65, "learning_rate": 5.291885580852306e-05, "loss": 0.0082, "step": 152370 }, { "epoch": 1.65, "learning_rate": 5.290263994292015e-05, "loss": 0.0075, "step": 152380 }, { "epoch": 1.65, "learning_rate": 5.288642407731724e-05, "loss": 0.0065, "step": 152390 }, { "epoch": 1.65, "learning_rate": 5.2870208211714336e-05, "loss": 0.0067, "step": 152400 }, { "epoch": 1.65, "learning_rate": 5.285399234611143e-05, "loss": 0.0076, "step": 152410 }, { "epoch": 1.65, "learning_rate": 5.283777648050853e-05, "loss": 0.0087, "step": 152420 }, { "epoch": 1.65, "learning_rate": 5.282156061490562e-05, "loss": 0.0075, "step": 152430 }, { "epoch": 1.65, "learning_rate": 5.2805344749302714e-05, "loss": 0.0089, "step": 152440 }, { "epoch": 1.65, "learning_rate": 5.2789128883699807e-05, "loss": 0.006, "step": 152450 }, { "epoch": 1.65, "learning_rate": 5.27729130180969e-05, "loss": 0.007, "step": 152460 }, { "epoch": 1.65, "learning_rate": 5.2756697152494e-05, "loss": 0.0088, "step": 152470 }, { "epoch": 1.65, "learning_rate": 5.274048128689109e-05, "loss": 0.0076, "step": 152480 }, { "epoch": 1.65, "learning_rate": 5.2724265421288184e-05, "loss": 0.0067, "step": 152490 }, { "epoch": 1.65, "learning_rate": 5.270804955568528e-05, "loss": 0.009, "step": 152500 }, { "epoch": 1.65, "learning_rate": 5.269183369008237e-05, "loss": 0.0066, "step": 152510 }, { "epoch": 1.65, "learning_rate": 5.267561782447946e-05, "loss": 0.0064, "step": 152520 }, { "epoch": 1.65, "learning_rate": 5.265940195887656e-05, "loss": 0.0073, "step": 152530 }, { "epoch": 1.65, "learning_rate": 5.2643186093273655e-05, "loss": 0.009, "step": 152540 }, { "epoch": 1.65, "learning_rate": 5.262697022767075e-05, "loss": 0.0078, "step": 152550 }, { "epoch": 1.65, "learning_rate": 5.261075436206784e-05, "loss": 0.0101, "step": 152560 }, { "epoch": 1.65, "learning_rate": 5.259453849646493e-05, "loss": 0.0093, "step": 152570 }, { "epoch": 1.65, "learning_rate": 5.257832263086203e-05, "loss": 0.0081, "step": 152580 }, { "epoch": 1.65, "learning_rate": 5.2562106765259125e-05, "loss": 0.0062, "step": 152590 }, { "epoch": 1.65, "learning_rate": 5.254589089965622e-05, "loss": 0.0084, "step": 152600 }, { "epoch": 1.65, "learning_rate": 5.252967503405331e-05, "loss": 0.0076, "step": 152610 }, { "epoch": 1.65, "learning_rate": 5.2513459168450404e-05, "loss": 0.0066, "step": 152620 }, { "epoch": 1.65, "learning_rate": 5.24972433028475e-05, "loss": 0.0073, "step": 152630 }, { "epoch": 1.65, "learning_rate": 5.2481027437244596e-05, "loss": 0.0068, "step": 152640 }, { "epoch": 1.65, "learning_rate": 5.246481157164169e-05, "loss": 0.0081, "step": 152650 }, { "epoch": 1.65, "learning_rate": 5.244859570603878e-05, "loss": 0.0073, "step": 152660 }, { "epoch": 1.65, "learning_rate": 5.2432379840435874e-05, "loss": 0.0089, "step": 152670 }, { "epoch": 1.65, "learning_rate": 5.241616397483297e-05, "loss": 0.0072, "step": 152680 }, { "epoch": 1.65, "learning_rate": 5.2399948109230066e-05, "loss": 0.0094, "step": 152690 }, { "epoch": 1.65, "learning_rate": 5.238373224362716e-05, "loss": 0.0086, "step": 152700 }, { "epoch": 1.65, "learning_rate": 5.236751637802425e-05, "loss": 0.0082, "step": 152710 }, { "epoch": 1.65, "learning_rate": 5.2351300512421345e-05, "loss": 0.0067, "step": 152720 }, { "epoch": 1.65, "learning_rate": 5.233508464681844e-05, "loss": 0.0108, "step": 152730 }, { "epoch": 1.65, "learning_rate": 5.231886878121554e-05, "loss": 0.0067, "step": 152740 }, { "epoch": 1.65, "learning_rate": 5.230265291561263e-05, "loss": 0.0082, "step": 152750 }, { "epoch": 1.65, "learning_rate": 5.228643705000972e-05, "loss": 0.0065, "step": 152760 }, { "epoch": 1.65, "learning_rate": 5.2270221184406815e-05, "loss": 0.008, "step": 152770 }, { "epoch": 1.65, "learning_rate": 5.225400531880391e-05, "loss": 0.0096, "step": 152780 }, { "epoch": 1.65, "learning_rate": 5.2237789453201e-05, "loss": 0.01, "step": 152790 }, { "epoch": 1.65, "learning_rate": 5.22215735875981e-05, "loss": 0.009, "step": 152800 }, { "epoch": 1.65, "learning_rate": 5.220535772199519e-05, "loss": 0.0068, "step": 152810 }, { "epoch": 1.65, "learning_rate": 5.2189141856392286e-05, "loss": 0.0072, "step": 152820 }, { "epoch": 1.65, "learning_rate": 5.217292599078938e-05, "loss": 0.0093, "step": 152830 }, { "epoch": 1.65, "learning_rate": 5.215671012518647e-05, "loss": 0.0061, "step": 152840 }, { "epoch": 1.65, "learning_rate": 5.214049425958357e-05, "loss": 0.0077, "step": 152850 }, { "epoch": 1.65, "learning_rate": 5.212427839398067e-05, "loss": 0.0066, "step": 152860 }, { "epoch": 1.65, "learning_rate": 5.210806252837776e-05, "loss": 0.0062, "step": 152870 }, { "epoch": 1.65, "learning_rate": 5.2091846662774856e-05, "loss": 0.0077, "step": 152880 }, { "epoch": 1.65, "learning_rate": 5.2075630797171955e-05, "loss": 0.0062, "step": 152890 }, { "epoch": 1.65, "learning_rate": 5.205941493156905e-05, "loss": 0.0048, "step": 152900 }, { "epoch": 1.65, "learning_rate": 5.204319906596614e-05, "loss": 0.0046, "step": 152910 }, { "epoch": 1.65, "learning_rate": 5.202698320036323e-05, "loss": 0.0083, "step": 152920 }, { "epoch": 1.65, "learning_rate": 5.2010767334760326e-05, "loss": 0.0081, "step": 152930 }, { "epoch": 1.65, "learning_rate": 5.1994551469157426e-05, "loss": 0.0073, "step": 152940 }, { "epoch": 1.65, "learning_rate": 5.197833560355452e-05, "loss": 0.0084, "step": 152950 }, { "epoch": 1.65, "learning_rate": 5.196211973795161e-05, "loss": 0.0067, "step": 152960 }, { "epoch": 1.65, "learning_rate": 5.1945903872348704e-05, "loss": 0.0082, "step": 152970 }, { "epoch": 1.65, "learning_rate": 5.1929688006745797e-05, "loss": 0.0064, "step": 152980 }, { "epoch": 1.65, "learning_rate": 5.191347214114289e-05, "loss": 0.0059, "step": 152990 }, { "epoch": 1.65, "learning_rate": 5.189725627553999e-05, "loss": 0.0066, "step": 153000 }, { "epoch": 1.65, "eval_cer": 0.9215121682588159, "eval_loss": 0.005926909390836954, "eval_runtime": 121.2098, "eval_samples_per_second": 16.5, "eval_steps_per_second": 4.125, "step": 153000 }, { "epoch": 1.65, "learning_rate": 5.188104040993708e-05, "loss": 0.0058, "step": 153010 }, { "epoch": 1.65, "learning_rate": 5.1864824544334174e-05, "loss": 0.0089, "step": 153020 }, { "epoch": 1.65, "learning_rate": 5.184860867873127e-05, "loss": 0.0054, "step": 153030 }, { "epoch": 1.65, "learning_rate": 5.183239281312836e-05, "loss": 0.0085, "step": 153040 }, { "epoch": 1.65, "learning_rate": 5.181617694752546e-05, "loss": 0.0052, "step": 153050 }, { "epoch": 1.65, "learning_rate": 5.179996108192255e-05, "loss": 0.0091, "step": 153060 }, { "epoch": 1.65, "learning_rate": 5.1783745216319645e-05, "loss": 0.0069, "step": 153070 }, { "epoch": 1.65, "learning_rate": 5.176752935071674e-05, "loss": 0.0049, "step": 153080 }, { "epoch": 1.65, "learning_rate": 5.175131348511383e-05, "loss": 0.0066, "step": 153090 }, { "epoch": 1.66, "learning_rate": 5.173509761951092e-05, "loss": 0.0072, "step": 153100 }, { "epoch": 1.66, "learning_rate": 5.171888175390802e-05, "loss": 0.0091, "step": 153110 }, { "epoch": 1.66, "learning_rate": 5.1702665888305115e-05, "loss": 0.0068, "step": 153120 }, { "epoch": 1.66, "learning_rate": 5.168645002270221e-05, "loss": 0.0065, "step": 153130 }, { "epoch": 1.66, "learning_rate": 5.16702341570993e-05, "loss": 0.0063, "step": 153140 }, { "epoch": 1.66, "learning_rate": 5.1654018291496393e-05, "loss": 0.0062, "step": 153150 }, { "epoch": 1.66, "learning_rate": 5.163780242589349e-05, "loss": 0.006, "step": 153160 }, { "epoch": 1.66, "learning_rate": 5.1621586560290586e-05, "loss": 0.0085, "step": 153170 }, { "epoch": 1.66, "learning_rate": 5.160537069468768e-05, "loss": 0.0095, "step": 153180 }, { "epoch": 1.66, "learning_rate": 5.158915482908477e-05, "loss": 0.0072, "step": 153190 }, { "epoch": 1.66, "learning_rate": 5.1572938963481864e-05, "loss": 0.0076, "step": 153200 }, { "epoch": 1.66, "learning_rate": 5.1556723097878963e-05, "loss": 0.0079, "step": 153210 }, { "epoch": 1.66, "learning_rate": 5.1540507232276056e-05, "loss": 0.0099, "step": 153220 }, { "epoch": 1.66, "learning_rate": 5.152429136667315e-05, "loss": 0.0077, "step": 153230 }, { "epoch": 1.66, "learning_rate": 5.150807550107024e-05, "loss": 0.0067, "step": 153240 }, { "epoch": 1.66, "learning_rate": 5.1491859635467334e-05, "loss": 0.007, "step": 153250 }, { "epoch": 1.66, "learning_rate": 5.147564376986443e-05, "loss": 0.0093, "step": 153260 }, { "epoch": 1.66, "learning_rate": 5.145942790426153e-05, "loss": 0.0056, "step": 153270 }, { "epoch": 1.66, "learning_rate": 5.144321203865862e-05, "loss": 0.008, "step": 153280 }, { "epoch": 1.66, "learning_rate": 5.142699617305571e-05, "loss": 0.0066, "step": 153290 }, { "epoch": 1.66, "learning_rate": 5.1410780307452805e-05, "loss": 0.0108, "step": 153300 }, { "epoch": 1.66, "learning_rate": 5.13945644418499e-05, "loss": 0.012, "step": 153310 }, { "epoch": 1.66, "learning_rate": 5.1378348576247e-05, "loss": 0.0076, "step": 153320 }, { "epoch": 1.66, "learning_rate": 5.136213271064409e-05, "loss": 0.0072, "step": 153330 }, { "epoch": 1.66, "learning_rate": 5.134591684504118e-05, "loss": 0.0092, "step": 153340 }, { "epoch": 1.66, "learning_rate": 5.1329700979438275e-05, "loss": 0.0066, "step": 153350 }, { "epoch": 1.66, "learning_rate": 5.131348511383537e-05, "loss": 0.0066, "step": 153360 }, { "epoch": 1.66, "learning_rate": 5.129726924823246e-05, "loss": 0.006, "step": 153370 }, { "epoch": 1.66, "learning_rate": 5.128105338262956e-05, "loss": 0.0063, "step": 153380 }, { "epoch": 1.66, "learning_rate": 5.126483751702665e-05, "loss": 0.0074, "step": 153390 }, { "epoch": 1.66, "learning_rate": 5.1248621651423746e-05, "loss": 0.0083, "step": 153400 }, { "epoch": 1.66, "learning_rate": 5.123240578582084e-05, "loss": 0.0053, "step": 153410 }, { "epoch": 1.66, "learning_rate": 5.121618992021793e-05, "loss": 0.0081, "step": 153420 }, { "epoch": 1.66, "learning_rate": 5.119997405461503e-05, "loss": 0.0085, "step": 153430 }, { "epoch": 1.66, "learning_rate": 5.1183758189012124e-05, "loss": 0.0064, "step": 153440 }, { "epoch": 1.66, "learning_rate": 5.1167542323409216e-05, "loss": 0.0077, "step": 153450 }, { "epoch": 1.66, "learning_rate": 5.115132645780631e-05, "loss": 0.0072, "step": 153460 }, { "epoch": 1.66, "learning_rate": 5.11351105922034e-05, "loss": 0.0058, "step": 153470 }, { "epoch": 1.66, "learning_rate": 5.11188947266005e-05, "loss": 0.0051, "step": 153480 }, { "epoch": 1.66, "learning_rate": 5.1102678860997594e-05, "loss": 0.0073, "step": 153490 }, { "epoch": 1.66, "learning_rate": 5.108646299539469e-05, "loss": 0.0071, "step": 153500 }, { "epoch": 1.66, "learning_rate": 5.107024712979178e-05, "loss": 0.0077, "step": 153510 }, { "epoch": 1.66, "learning_rate": 5.105403126418887e-05, "loss": 0.0078, "step": 153520 }, { "epoch": 1.66, "learning_rate": 5.1037815398585965e-05, "loss": 0.008, "step": 153530 }, { "epoch": 1.66, "learning_rate": 5.1021599532983065e-05, "loss": 0.0079, "step": 153540 }, { "epoch": 1.66, "learning_rate": 5.100538366738016e-05, "loss": 0.0065, "step": 153550 }, { "epoch": 1.66, "learning_rate": 5.098916780177725e-05, "loss": 0.0072, "step": 153560 }, { "epoch": 1.66, "learning_rate": 5.097295193617434e-05, "loss": 0.0063, "step": 153570 }, { "epoch": 1.66, "learning_rate": 5.095673607057145e-05, "loss": 0.008, "step": 153580 }, { "epoch": 1.66, "learning_rate": 5.094052020496854e-05, "loss": 0.006, "step": 153590 }, { "epoch": 1.66, "learning_rate": 5.0924304339365635e-05, "loss": 0.007, "step": 153600 }, { "epoch": 1.66, "learning_rate": 5.090808847376273e-05, "loss": 0.0068, "step": 153610 }, { "epoch": 1.66, "learning_rate": 5.089187260815982e-05, "loss": 0.0071, "step": 153620 }, { "epoch": 1.66, "learning_rate": 5.087565674255692e-05, "loss": 0.0065, "step": 153630 }, { "epoch": 1.66, "learning_rate": 5.085944087695401e-05, "loss": 0.0075, "step": 153640 }, { "epoch": 1.66, "learning_rate": 5.0843225011351105e-05, "loss": 0.006, "step": 153650 }, { "epoch": 1.66, "learning_rate": 5.08270091457482e-05, "loss": 0.0076, "step": 153660 }, { "epoch": 1.66, "learning_rate": 5.081079328014529e-05, "loss": 0.0068, "step": 153670 }, { "epoch": 1.66, "learning_rate": 5.0794577414542383e-05, "loss": 0.0095, "step": 153680 }, { "epoch": 1.66, "learning_rate": 5.077836154893948e-05, "loss": 0.0076, "step": 153690 }, { "epoch": 1.66, "learning_rate": 5.0762145683336576e-05, "loss": 0.0078, "step": 153700 }, { "epoch": 1.66, "learning_rate": 5.074592981773367e-05, "loss": 0.0077, "step": 153710 }, { "epoch": 1.66, "learning_rate": 5.072971395213076e-05, "loss": 0.0081, "step": 153720 }, { "epoch": 1.66, "learning_rate": 5.0713498086527854e-05, "loss": 0.0082, "step": 153730 }, { "epoch": 1.66, "learning_rate": 5.0697282220924953e-05, "loss": 0.008, "step": 153740 }, { "epoch": 1.66, "learning_rate": 5.0681066355322046e-05, "loss": 0.0076, "step": 153750 }, { "epoch": 1.66, "learning_rate": 5.066485048971914e-05, "loss": 0.0075, "step": 153760 }, { "epoch": 1.66, "learning_rate": 5.064863462411623e-05, "loss": 0.0066, "step": 153770 }, { "epoch": 1.66, "learning_rate": 5.0632418758513324e-05, "loss": 0.0078, "step": 153780 }, { "epoch": 1.66, "learning_rate": 5.0616202892910424e-05, "loss": 0.0095, "step": 153790 }, { "epoch": 1.66, "learning_rate": 5.059998702730752e-05, "loss": 0.0062, "step": 153800 }, { "epoch": 1.66, "learning_rate": 5.058377116170461e-05, "loss": 0.0071, "step": 153810 }, { "epoch": 1.66, "learning_rate": 5.05675552961017e-05, "loss": 0.0081, "step": 153820 }, { "epoch": 1.66, "learning_rate": 5.0551339430498795e-05, "loss": 0.0074, "step": 153830 }, { "epoch": 1.66, "learning_rate": 5.053512356489589e-05, "loss": 0.0063, "step": 153840 }, { "epoch": 1.66, "learning_rate": 5.051890769929299e-05, "loss": 0.0061, "step": 153850 }, { "epoch": 1.66, "learning_rate": 5.050269183369008e-05, "loss": 0.0073, "step": 153860 }, { "epoch": 1.66, "learning_rate": 5.048647596808717e-05, "loss": 0.009, "step": 153870 }, { "epoch": 1.66, "learning_rate": 5.0470260102484265e-05, "loss": 0.0092, "step": 153880 }, { "epoch": 1.66, "learning_rate": 5.045404423688136e-05, "loss": 0.0075, "step": 153890 }, { "epoch": 1.66, "learning_rate": 5.043782837127846e-05, "loss": 0.0077, "step": 153900 }, { "epoch": 1.66, "learning_rate": 5.042161250567555e-05, "loss": 0.0095, "step": 153910 }, { "epoch": 1.66, "learning_rate": 5.040539664007264e-05, "loss": 0.0073, "step": 153920 }, { "epoch": 1.66, "learning_rate": 5.0389180774469736e-05, "loss": 0.0068, "step": 153930 }, { "epoch": 1.66, "learning_rate": 5.037296490886683e-05, "loss": 0.0058, "step": 153940 }, { "epoch": 1.66, "learning_rate": 5.035674904326393e-05, "loss": 0.0066, "step": 153950 }, { "epoch": 1.66, "learning_rate": 5.034053317766102e-05, "loss": 0.0071, "step": 153960 }, { "epoch": 1.66, "learning_rate": 5.0324317312058114e-05, "loss": 0.0097, "step": 153970 }, { "epoch": 1.66, "learning_rate": 5.0308101446455206e-05, "loss": 0.0078, "step": 153980 }, { "epoch": 1.66, "learning_rate": 5.02918855808523e-05, "loss": 0.0064, "step": 153990 }, { "epoch": 1.66, "learning_rate": 5.027566971524939e-05, "loss": 0.0076, "step": 154000 }, { "epoch": 1.66, "eval_cer": 0.9215251973031615, "eval_loss": 0.005830066278576851, "eval_runtime": 121.2077, "eval_samples_per_second": 16.501, "eval_steps_per_second": 4.125, "step": 154000 }, { "epoch": 1.66, "learning_rate": 5.025945384964649e-05, "loss": 0.0058, "step": 154010 }, { "epoch": 1.67, "learning_rate": 5.0243237984043584e-05, "loss": 0.0093, "step": 154020 }, { "epoch": 1.67, "learning_rate": 5.022702211844068e-05, "loss": 0.0053, "step": 154030 }, { "epoch": 1.67, "learning_rate": 5.021080625283777e-05, "loss": 0.0063, "step": 154040 }, { "epoch": 1.67, "learning_rate": 5.019459038723486e-05, "loss": 0.006, "step": 154050 }, { "epoch": 1.67, "learning_rate": 5.017837452163196e-05, "loss": 0.0091, "step": 154060 }, { "epoch": 1.67, "learning_rate": 5.0162158656029055e-05, "loss": 0.0072, "step": 154070 }, { "epoch": 1.67, "learning_rate": 5.014594279042615e-05, "loss": 0.0075, "step": 154080 }, { "epoch": 1.67, "learning_rate": 5.012972692482324e-05, "loss": 0.0084, "step": 154090 }, { "epoch": 1.67, "learning_rate": 5.011351105922033e-05, "loss": 0.0091, "step": 154100 }, { "epoch": 1.67, "learning_rate": 5.0097295193617426e-05, "loss": 0.0071, "step": 154110 }, { "epoch": 1.67, "learning_rate": 5.0081079328014525e-05, "loss": 0.01, "step": 154120 }, { "epoch": 1.67, "learning_rate": 5.006486346241162e-05, "loss": 0.0084, "step": 154130 }, { "epoch": 1.67, "learning_rate": 5.004864759680871e-05, "loss": 0.0074, "step": 154140 }, { "epoch": 1.67, "learning_rate": 5.00324317312058e-05, "loss": 0.0076, "step": 154150 }, { "epoch": 1.67, "learning_rate": 5.0016215865602896e-05, "loss": 0.0114, "step": 154160 }, { "epoch": 1.67, "learning_rate": 4.9999999999999996e-05, "loss": 0.0064, "step": 154170 }, { "epoch": 1.67, "learning_rate": 4.998378413439709e-05, "loss": 0.0069, "step": 154180 }, { "epoch": 1.67, "learning_rate": 4.996756826879418e-05, "loss": 0.0063, "step": 154190 }, { "epoch": 1.67, "learning_rate": 4.9951352403191274e-05, "loss": 0.0066, "step": 154200 }, { "epoch": 1.67, "learning_rate": 4.9935136537588367e-05, "loss": 0.0058, "step": 154210 }, { "epoch": 1.67, "learning_rate": 4.9918920671985466e-05, "loss": 0.0072, "step": 154220 }, { "epoch": 1.67, "learning_rate": 4.990270480638256e-05, "loss": 0.0066, "step": 154230 }, { "epoch": 1.67, "learning_rate": 4.988648894077965e-05, "loss": 0.0064, "step": 154240 }, { "epoch": 1.67, "learning_rate": 4.9870273075176744e-05, "loss": 0.0067, "step": 154250 }, { "epoch": 1.67, "learning_rate": 4.985405720957384e-05, "loss": 0.0092, "step": 154260 }, { "epoch": 1.67, "learning_rate": 4.983784134397093e-05, "loss": 0.0084, "step": 154270 }, { "epoch": 1.67, "learning_rate": 4.982162547836803e-05, "loss": 0.0078, "step": 154280 }, { "epoch": 1.67, "learning_rate": 4.980540961276513e-05, "loss": 0.0089, "step": 154290 }, { "epoch": 1.67, "learning_rate": 4.978919374716222e-05, "loss": 0.006, "step": 154300 }, { "epoch": 1.67, "learning_rate": 4.9772977881559314e-05, "loss": 0.009, "step": 154310 }, { "epoch": 1.67, "learning_rate": 4.9756762015956414e-05, "loss": 0.0066, "step": 154320 }, { "epoch": 1.67, "learning_rate": 4.974054615035351e-05, "loss": 0.0083, "step": 154330 }, { "epoch": 1.67, "learning_rate": 4.97243302847506e-05, "loss": 0.0054, "step": 154340 }, { "epoch": 1.67, "learning_rate": 4.970811441914769e-05, "loss": 0.0095, "step": 154350 }, { "epoch": 1.67, "learning_rate": 4.9691898553544785e-05, "loss": 0.0058, "step": 154360 }, { "epoch": 1.67, "learning_rate": 4.9675682687941884e-05, "loss": 0.0059, "step": 154370 }, { "epoch": 1.67, "learning_rate": 4.965946682233898e-05, "loss": 0.0062, "step": 154380 }, { "epoch": 1.67, "learning_rate": 4.964325095673607e-05, "loss": 0.0069, "step": 154390 }, { "epoch": 1.67, "learning_rate": 4.962703509113316e-05, "loss": 0.0064, "step": 154400 }, { "epoch": 1.67, "learning_rate": 4.9610819225530255e-05, "loss": 0.0064, "step": 154410 }, { "epoch": 1.67, "learning_rate": 4.959460335992735e-05, "loss": 0.0059, "step": 154420 }, { "epoch": 1.67, "learning_rate": 4.957838749432445e-05, "loss": 0.0063, "step": 154430 }, { "epoch": 1.67, "learning_rate": 4.956217162872154e-05, "loss": 0.0062, "step": 154440 }, { "epoch": 1.67, "learning_rate": 4.954595576311863e-05, "loss": 0.0087, "step": 154450 }, { "epoch": 1.67, "learning_rate": 4.9529739897515726e-05, "loss": 0.006, "step": 154460 }, { "epoch": 1.67, "learning_rate": 4.951352403191282e-05, "loss": 0.007, "step": 154470 }, { "epoch": 1.67, "learning_rate": 4.949730816630992e-05, "loss": 0.0076, "step": 154480 }, { "epoch": 1.67, "learning_rate": 4.948109230070701e-05, "loss": 0.0095, "step": 154490 }, { "epoch": 1.67, "learning_rate": 4.9464876435104104e-05, "loss": 0.0048, "step": 154500 }, { "epoch": 1.67, "learning_rate": 4.9448660569501196e-05, "loss": 0.0058, "step": 154510 }, { "epoch": 1.67, "learning_rate": 4.943244470389829e-05, "loss": 0.0073, "step": 154520 }, { "epoch": 1.67, "learning_rate": 4.941622883829539e-05, "loss": 0.0063, "step": 154530 }, { "epoch": 1.67, "learning_rate": 4.940001297269248e-05, "loss": 0.0074, "step": 154540 }, { "epoch": 1.67, "learning_rate": 4.9383797107089574e-05, "loss": 0.0061, "step": 154550 }, { "epoch": 1.67, "learning_rate": 4.936758124148667e-05, "loss": 0.0073, "step": 154560 }, { "epoch": 1.67, "learning_rate": 4.935136537588376e-05, "loss": 0.0072, "step": 154570 }, { "epoch": 1.67, "learning_rate": 4.933514951028085e-05, "loss": 0.0073, "step": 154580 }, { "epoch": 1.67, "learning_rate": 4.931893364467795e-05, "loss": 0.0067, "step": 154590 }, { "epoch": 1.67, "learning_rate": 4.9302717779075045e-05, "loss": 0.0075, "step": 154600 }, { "epoch": 1.67, "learning_rate": 4.928650191347214e-05, "loss": 0.0062, "step": 154610 }, { "epoch": 1.67, "learning_rate": 4.927028604786923e-05, "loss": 0.0064, "step": 154620 }, { "epoch": 1.67, "learning_rate": 4.925407018226632e-05, "loss": 0.0079, "step": 154630 }, { "epoch": 1.67, "learning_rate": 4.923785431666342e-05, "loss": 0.0056, "step": 154640 }, { "epoch": 1.67, "learning_rate": 4.9221638451060515e-05, "loss": 0.0078, "step": 154650 }, { "epoch": 1.67, "learning_rate": 4.920542258545761e-05, "loss": 0.006, "step": 154660 }, { "epoch": 1.67, "learning_rate": 4.91892067198547e-05, "loss": 0.009, "step": 154670 }, { "epoch": 1.67, "learning_rate": 4.917299085425179e-05, "loss": 0.0066, "step": 154680 }, { "epoch": 1.67, "learning_rate": 4.9156774988648886e-05, "loss": 0.0079, "step": 154690 }, { "epoch": 1.67, "learning_rate": 4.9140559123045986e-05, "loss": 0.01, "step": 154700 }, { "epoch": 1.67, "learning_rate": 4.912434325744308e-05, "loss": 0.0079, "step": 154710 }, { "epoch": 1.67, "learning_rate": 4.910812739184017e-05, "loss": 0.008, "step": 154720 }, { "epoch": 1.67, "learning_rate": 4.9091911526237264e-05, "loss": 0.007, "step": 154730 }, { "epoch": 1.67, "learning_rate": 4.9075695660634357e-05, "loss": 0.0075, "step": 154740 }, { "epoch": 1.67, "learning_rate": 4.9059479795031456e-05, "loss": 0.0085, "step": 154750 }, { "epoch": 1.67, "learning_rate": 4.904326392942855e-05, "loss": 0.0061, "step": 154760 }, { "epoch": 1.67, "learning_rate": 4.902704806382564e-05, "loss": 0.0062, "step": 154770 }, { "epoch": 1.67, "learning_rate": 4.9010832198222734e-05, "loss": 0.0119, "step": 154780 }, { "epoch": 1.67, "learning_rate": 4.899461633261983e-05, "loss": 0.0081, "step": 154790 }, { "epoch": 1.67, "learning_rate": 4.8978400467016927e-05, "loss": 0.008, "step": 154800 }, { "epoch": 1.67, "learning_rate": 4.896218460141402e-05, "loss": 0.0071, "step": 154810 }, { "epoch": 1.67, "learning_rate": 4.894596873581111e-05, "loss": 0.0064, "step": 154820 }, { "epoch": 1.67, "learning_rate": 4.8929752870208205e-05, "loss": 0.0058, "step": 154830 }, { "epoch": 1.67, "learning_rate": 4.89135370046053e-05, "loss": 0.0061, "step": 154840 }, { "epoch": 1.67, "learning_rate": 4.889732113900239e-05, "loss": 0.0079, "step": 154850 }, { "epoch": 1.67, "learning_rate": 4.888110527339949e-05, "loss": 0.0079, "step": 154860 }, { "epoch": 1.67, "learning_rate": 4.886488940779658e-05, "loss": 0.007, "step": 154870 }, { "epoch": 1.67, "learning_rate": 4.8848673542193675e-05, "loss": 0.0093, "step": 154880 }, { "epoch": 1.67, "learning_rate": 4.883245767659077e-05, "loss": 0.0079, "step": 154890 }, { "epoch": 1.67, "learning_rate": 4.881624181098786e-05, "loss": 0.0052, "step": 154900 }, { "epoch": 1.67, "learning_rate": 4.880002594538496e-05, "loss": 0.0064, "step": 154910 }, { "epoch": 1.67, "learning_rate": 4.878381007978205e-05, "loss": 0.0085, "step": 154920 }, { "epoch": 1.67, "learning_rate": 4.8767594214179146e-05, "loss": 0.0063, "step": 154930 }, { "epoch": 1.67, "learning_rate": 4.875137834857624e-05, "loss": 0.0088, "step": 154940 }, { "epoch": 1.68, "learning_rate": 4.873516248297333e-05, "loss": 0.0059, "step": 154950 }, { "epoch": 1.68, "learning_rate": 4.8718946617370424e-05, "loss": 0.0051, "step": 154960 }, { "epoch": 1.68, "learning_rate": 4.8702730751767524e-05, "loss": 0.0062, "step": 154970 }, { "epoch": 1.68, "learning_rate": 4.8686514886164616e-05, "loss": 0.0085, "step": 154980 }, { "epoch": 1.68, "learning_rate": 4.867029902056171e-05, "loss": 0.0069, "step": 154990 }, { "epoch": 1.68, "learning_rate": 4.86540831549588e-05, "loss": 0.0073, "step": 155000 }, { "epoch": 1.68, "eval_cer": 0.9215251973031615, "eval_loss": 0.005951076280325651, "eval_runtime": 121.1875, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 155000 }, { "epoch": 1.68, "learning_rate": 4.863786728935591e-05, "loss": 0.0102, "step": 155010 }, { "epoch": 1.68, "learning_rate": 4.8621651423753e-05, "loss": 0.0067, "step": 155020 }, { "epoch": 1.68, "learning_rate": 4.8605435558150094e-05, "loss": 0.008, "step": 155030 }, { "epoch": 1.68, "learning_rate": 4.8589219692547186e-05, "loss": 0.0062, "step": 155040 }, { "epoch": 1.68, "learning_rate": 4.857300382694428e-05, "loss": 0.0069, "step": 155050 }, { "epoch": 1.68, "learning_rate": 4.855678796134138e-05, "loss": 0.0069, "step": 155060 }, { "epoch": 1.68, "learning_rate": 4.854057209573847e-05, "loss": 0.007, "step": 155070 }, { "epoch": 1.68, "learning_rate": 4.8524356230135564e-05, "loss": 0.0069, "step": 155080 }, { "epoch": 1.68, "learning_rate": 4.850814036453266e-05, "loss": 0.0062, "step": 155090 }, { "epoch": 1.68, "learning_rate": 4.849192449892975e-05, "loss": 0.007, "step": 155100 }, { "epoch": 1.68, "learning_rate": 4.847570863332685e-05, "loss": 0.006, "step": 155110 }, { "epoch": 1.68, "learning_rate": 4.845949276772394e-05, "loss": 0.008, "step": 155120 }, { "epoch": 1.68, "learning_rate": 4.8443276902121035e-05, "loss": 0.0076, "step": 155130 }, { "epoch": 1.68, "learning_rate": 4.842706103651813e-05, "loss": 0.0064, "step": 155140 }, { "epoch": 1.68, "learning_rate": 4.841084517091522e-05, "loss": 0.007, "step": 155150 }, { "epoch": 1.68, "learning_rate": 4.839462930531231e-05, "loss": 0.007, "step": 155160 }, { "epoch": 1.68, "learning_rate": 4.837841343970941e-05, "loss": 0.005, "step": 155170 }, { "epoch": 1.68, "learning_rate": 4.8362197574106505e-05, "loss": 0.0083, "step": 155180 }, { "epoch": 1.68, "learning_rate": 4.83459817085036e-05, "loss": 0.0067, "step": 155190 }, { "epoch": 1.68, "learning_rate": 4.832976584290069e-05, "loss": 0.0097, "step": 155200 }, { "epoch": 1.68, "learning_rate": 4.831354997729778e-05, "loss": 0.0068, "step": 155210 }, { "epoch": 1.68, "learning_rate": 4.829733411169488e-05, "loss": 0.0103, "step": 155220 }, { "epoch": 1.68, "learning_rate": 4.8281118246091976e-05, "loss": 0.0084, "step": 155230 }, { "epoch": 1.68, "learning_rate": 4.826490238048907e-05, "loss": 0.0091, "step": 155240 }, { "epoch": 1.68, "learning_rate": 4.824868651488616e-05, "loss": 0.0071, "step": 155250 }, { "epoch": 1.68, "learning_rate": 4.8232470649283254e-05, "loss": 0.0093, "step": 155260 }, { "epoch": 1.68, "learning_rate": 4.8216254783680346e-05, "loss": 0.006, "step": 155270 }, { "epoch": 1.68, "learning_rate": 4.8200038918077446e-05, "loss": 0.0057, "step": 155280 }, { "epoch": 1.68, "learning_rate": 4.818382305247454e-05, "loss": 0.0059, "step": 155290 }, { "epoch": 1.68, "learning_rate": 4.816760718687163e-05, "loss": 0.0056, "step": 155300 }, { "epoch": 1.68, "learning_rate": 4.8151391321268724e-05, "loss": 0.0067, "step": 155310 }, { "epoch": 1.68, "learning_rate": 4.813517545566582e-05, "loss": 0.0104, "step": 155320 }, { "epoch": 1.68, "learning_rate": 4.8118959590062916e-05, "loss": 0.0062, "step": 155330 }, { "epoch": 1.68, "learning_rate": 4.810274372446001e-05, "loss": 0.0075, "step": 155340 }, { "epoch": 1.68, "learning_rate": 4.80865278588571e-05, "loss": 0.0069, "step": 155350 }, { "epoch": 1.68, "learning_rate": 4.8070311993254195e-05, "loss": 0.008, "step": 155360 }, { "epoch": 1.68, "learning_rate": 4.805409612765129e-05, "loss": 0.0085, "step": 155370 }, { "epoch": 1.68, "learning_rate": 4.803788026204839e-05, "loss": 0.0073, "step": 155380 }, { "epoch": 1.68, "learning_rate": 4.802166439644548e-05, "loss": 0.0088, "step": 155390 }, { "epoch": 1.68, "learning_rate": 4.800544853084257e-05, "loss": 0.0053, "step": 155400 }, { "epoch": 1.68, "learning_rate": 4.7989232665239665e-05, "loss": 0.0073, "step": 155410 }, { "epoch": 1.68, "learning_rate": 4.797301679963676e-05, "loss": 0.007, "step": 155420 }, { "epoch": 1.68, "learning_rate": 4.795680093403385e-05, "loss": 0.007, "step": 155430 }, { "epoch": 1.68, "learning_rate": 4.794058506843095e-05, "loss": 0.0059, "step": 155440 }, { "epoch": 1.68, "learning_rate": 4.792436920282804e-05, "loss": 0.0101, "step": 155450 }, { "epoch": 1.68, "learning_rate": 4.7908153337225136e-05, "loss": 0.0081, "step": 155460 }, { "epoch": 1.68, "learning_rate": 4.789193747162223e-05, "loss": 0.0069, "step": 155470 }, { "epoch": 1.68, "learning_rate": 4.787572160601932e-05, "loss": 0.0068, "step": 155480 }, { "epoch": 1.68, "learning_rate": 4.785950574041642e-05, "loss": 0.0084, "step": 155490 }, { "epoch": 1.68, "learning_rate": 4.7843289874813513e-05, "loss": 0.0072, "step": 155500 }, { "epoch": 1.68, "learning_rate": 4.7827074009210606e-05, "loss": 0.0078, "step": 155510 }, { "epoch": 1.68, "learning_rate": 4.78108581436077e-05, "loss": 0.0053, "step": 155520 }, { "epoch": 1.68, "learning_rate": 4.779464227800479e-05, "loss": 0.0068, "step": 155530 }, { "epoch": 1.68, "learning_rate": 4.777842641240189e-05, "loss": 0.005, "step": 155540 }, { "epoch": 1.68, "learning_rate": 4.7762210546798984e-05, "loss": 0.0074, "step": 155550 }, { "epoch": 1.68, "learning_rate": 4.774599468119608e-05, "loss": 0.0066, "step": 155560 }, { "epoch": 1.68, "learning_rate": 4.772977881559317e-05, "loss": 0.007, "step": 155570 }, { "epoch": 1.68, "learning_rate": 4.771356294999026e-05, "loss": 0.0076, "step": 155580 }, { "epoch": 1.68, "learning_rate": 4.7697347084387355e-05, "loss": 0.007, "step": 155590 }, { "epoch": 1.68, "learning_rate": 4.7681131218784454e-05, "loss": 0.0064, "step": 155600 }, { "epoch": 1.68, "learning_rate": 4.766491535318155e-05, "loss": 0.0093, "step": 155610 }, { "epoch": 1.68, "learning_rate": 4.764869948757864e-05, "loss": 0.0083, "step": 155620 }, { "epoch": 1.68, "learning_rate": 4.763248362197573e-05, "loss": 0.0065, "step": 155630 }, { "epoch": 1.68, "learning_rate": 4.7616267756372825e-05, "loss": 0.0075, "step": 155640 }, { "epoch": 1.68, "learning_rate": 4.7600051890769925e-05, "loss": 0.0072, "step": 155650 }, { "epoch": 1.68, "learning_rate": 4.758383602516702e-05, "loss": 0.0076, "step": 155660 }, { "epoch": 1.68, "learning_rate": 4.756762015956411e-05, "loss": 0.0085, "step": 155670 }, { "epoch": 1.68, "learning_rate": 4.75514042939612e-05, "loss": 0.0085, "step": 155680 }, { "epoch": 1.68, "learning_rate": 4.7535188428358296e-05, "loss": 0.009, "step": 155690 }, { "epoch": 1.68, "learning_rate": 4.751897256275539e-05, "loss": 0.0062, "step": 155700 }, { "epoch": 1.68, "learning_rate": 4.750275669715249e-05, "loss": 0.0069, "step": 155710 }, { "epoch": 1.68, "learning_rate": 4.748654083154958e-05, "loss": 0.0077, "step": 155720 }, { "epoch": 1.68, "learning_rate": 4.747032496594668e-05, "loss": 0.0073, "step": 155730 }, { "epoch": 1.68, "learning_rate": 4.745410910034377e-05, "loss": 0.0079, "step": 155740 }, { "epoch": 1.68, "learning_rate": 4.743789323474087e-05, "loss": 0.0075, "step": 155750 }, { "epoch": 1.68, "learning_rate": 4.7421677369137965e-05, "loss": 0.0091, "step": 155760 }, { "epoch": 1.68, "learning_rate": 4.740546150353506e-05, "loss": 0.0057, "step": 155770 }, { "epoch": 1.68, "learning_rate": 4.738924563793215e-05, "loss": 0.0068, "step": 155780 }, { "epoch": 1.68, "learning_rate": 4.7373029772329244e-05, "loss": 0.0077, "step": 155790 }, { "epoch": 1.68, "learning_rate": 4.735681390672634e-05, "loss": 0.0076, "step": 155800 }, { "epoch": 1.68, "learning_rate": 4.7340598041123436e-05, "loss": 0.0063, "step": 155810 }, { "epoch": 1.68, "learning_rate": 4.732438217552053e-05, "loss": 0.0072, "step": 155820 }, { "epoch": 1.68, "learning_rate": 4.730816630991762e-05, "loss": 0.009, "step": 155830 }, { "epoch": 1.68, "learning_rate": 4.7291950444314714e-05, "loss": 0.0064, "step": 155840 }, { "epoch": 1.68, "learning_rate": 4.727573457871181e-05, "loss": 0.0066, "step": 155850 }, { "epoch": 1.68, "learning_rate": 4.7259518713108906e-05, "loss": 0.0078, "step": 155860 }, { "epoch": 1.69, "learning_rate": 4.7243302847506e-05, "loss": 0.006, "step": 155870 }, { "epoch": 1.69, "learning_rate": 4.722708698190309e-05, "loss": 0.0077, "step": 155880 }, { "epoch": 1.69, "learning_rate": 4.7210871116300185e-05, "loss": 0.0071, "step": 155890 }, { "epoch": 1.69, "learning_rate": 4.719465525069728e-05, "loss": 0.0067, "step": 155900 }, { "epoch": 1.69, "learning_rate": 4.717843938509438e-05, "loss": 0.0072, "step": 155910 }, { "epoch": 1.69, "learning_rate": 4.716222351949147e-05, "loss": 0.0076, "step": 155920 }, { "epoch": 1.69, "learning_rate": 4.714600765388856e-05, "loss": 0.0054, "step": 155930 }, { "epoch": 1.69, "learning_rate": 4.7129791788285655e-05, "loss": 0.0043, "step": 155940 }, { "epoch": 1.69, "learning_rate": 4.711357592268275e-05, "loss": 0.0061, "step": 155950 }, { "epoch": 1.69, "learning_rate": 4.709736005707985e-05, "loss": 0.008, "step": 155960 }, { "epoch": 1.69, "learning_rate": 4.708114419147694e-05, "loss": 0.0075, "step": 155970 }, { "epoch": 1.69, "learning_rate": 4.706492832587403e-05, "loss": 0.008, "step": 155980 }, { "epoch": 1.69, "learning_rate": 4.7048712460271126e-05, "loss": 0.0066, "step": 155990 }, { "epoch": 1.69, "learning_rate": 4.703249659466822e-05, "loss": 0.0118, "step": 156000 }, { "epoch": 1.69, "eval_cer": 0.9215477809800273, "eval_loss": 0.006024594884365797, "eval_runtime": 121.1774, "eval_samples_per_second": 16.505, "eval_steps_per_second": 4.126, "step": 156000 }, { "epoch": 1.69, "learning_rate": 4.701628072906531e-05, "loss": 0.0061, "step": 156010 }, { "epoch": 1.69, "learning_rate": 4.700006486346241e-05, "loss": 0.0076, "step": 156020 }, { "epoch": 1.69, "learning_rate": 4.6983848997859503e-05, "loss": 0.0091, "step": 156030 }, { "epoch": 1.69, "learning_rate": 4.6967633132256596e-05, "loss": 0.005, "step": 156040 }, { "epoch": 1.69, "learning_rate": 4.695141726665369e-05, "loss": 0.0066, "step": 156050 }, { "epoch": 1.69, "learning_rate": 4.693520140105078e-05, "loss": 0.0083, "step": 156060 }, { "epoch": 1.69, "learning_rate": 4.691898553544788e-05, "loss": 0.007, "step": 156070 }, { "epoch": 1.69, "learning_rate": 4.6902769669844974e-05, "loss": 0.0082, "step": 156080 }, { "epoch": 1.69, "learning_rate": 4.688655380424207e-05, "loss": 0.0073, "step": 156090 }, { "epoch": 1.69, "learning_rate": 4.687033793863916e-05, "loss": 0.0079, "step": 156100 }, { "epoch": 1.69, "learning_rate": 4.685412207303625e-05, "loss": 0.007, "step": 156110 }, { "epoch": 1.69, "learning_rate": 4.683790620743335e-05, "loss": 0.0074, "step": 156120 }, { "epoch": 1.69, "learning_rate": 4.6821690341830444e-05, "loss": 0.0071, "step": 156130 }, { "epoch": 1.69, "learning_rate": 4.680547447622754e-05, "loss": 0.0076, "step": 156140 }, { "epoch": 1.69, "learning_rate": 4.678925861062463e-05, "loss": 0.007, "step": 156150 }, { "epoch": 1.69, "learning_rate": 4.677304274502172e-05, "loss": 0.0079, "step": 156160 }, { "epoch": 1.69, "learning_rate": 4.6756826879418815e-05, "loss": 0.0062, "step": 156170 }, { "epoch": 1.69, "learning_rate": 4.6740611013815915e-05, "loss": 0.0066, "step": 156180 }, { "epoch": 1.69, "learning_rate": 4.672439514821301e-05, "loss": 0.0085, "step": 156190 }, { "epoch": 1.69, "learning_rate": 4.67081792826101e-05, "loss": 0.0061, "step": 156200 }, { "epoch": 1.69, "learning_rate": 4.669196341700719e-05, "loss": 0.0054, "step": 156210 }, { "epoch": 1.69, "learning_rate": 4.6675747551404286e-05, "loss": 0.0058, "step": 156220 }, { "epoch": 1.69, "learning_rate": 4.6659531685801385e-05, "loss": 0.0081, "step": 156230 }, { "epoch": 1.69, "learning_rate": 4.664331582019848e-05, "loss": 0.0069, "step": 156240 }, { "epoch": 1.69, "learning_rate": 4.662709995459557e-05, "loss": 0.0078, "step": 156250 }, { "epoch": 1.69, "learning_rate": 4.6610884088992664e-05, "loss": 0.0063, "step": 156260 }, { "epoch": 1.69, "learning_rate": 4.6594668223389756e-05, "loss": 0.0054, "step": 156270 }, { "epoch": 1.69, "learning_rate": 4.657845235778685e-05, "loss": 0.0066, "step": 156280 }, { "epoch": 1.69, "learning_rate": 4.656223649218395e-05, "loss": 0.0065, "step": 156290 }, { "epoch": 1.69, "learning_rate": 4.654602062658104e-05, "loss": 0.0085, "step": 156300 }, { "epoch": 1.69, "learning_rate": 4.6529804760978134e-05, "loss": 0.0053, "step": 156310 }, { "epoch": 1.69, "learning_rate": 4.651358889537523e-05, "loss": 0.0051, "step": 156320 }, { "epoch": 1.69, "learning_rate": 4.649737302977232e-05, "loss": 0.0065, "step": 156330 }, { "epoch": 1.69, "learning_rate": 4.648115716416942e-05, "loss": 0.0072, "step": 156340 }, { "epoch": 1.69, "learning_rate": 4.646494129856651e-05, "loss": 0.0062, "step": 156350 }, { "epoch": 1.69, "learning_rate": 4.6448725432963605e-05, "loss": 0.0059, "step": 156360 }, { "epoch": 1.69, "learning_rate": 4.64325095673607e-05, "loss": 0.0088, "step": 156370 }, { "epoch": 1.69, "learning_rate": 4.641629370175779e-05, "loss": 0.0073, "step": 156380 }, { "epoch": 1.69, "learning_rate": 4.640007783615489e-05, "loss": 0.0097, "step": 156390 }, { "epoch": 1.69, "learning_rate": 4.638386197055198e-05, "loss": 0.0099, "step": 156400 }, { "epoch": 1.69, "learning_rate": 4.6367646104949075e-05, "loss": 0.0048, "step": 156410 }, { "epoch": 1.69, "learning_rate": 4.635143023934617e-05, "loss": 0.0095, "step": 156420 }, { "epoch": 1.69, "learning_rate": 4.633521437374326e-05, "loss": 0.0069, "step": 156430 }, { "epoch": 1.69, "learning_rate": 4.631899850814035e-05, "loss": 0.0051, "step": 156440 }, { "epoch": 1.69, "learning_rate": 4.630278264253746e-05, "loss": 0.0073, "step": 156450 }, { "epoch": 1.69, "learning_rate": 4.628656677693455e-05, "loss": 0.0077, "step": 156460 }, { "epoch": 1.69, "learning_rate": 4.6270350911331645e-05, "loss": 0.0071, "step": 156470 }, { "epoch": 1.69, "learning_rate": 4.625413504572874e-05, "loss": 0.0065, "step": 156480 }, { "epoch": 1.69, "learning_rate": 4.623791918012584e-05, "loss": 0.0106, "step": 156490 }, { "epoch": 1.69, "learning_rate": 4.622170331452293e-05, "loss": 0.0067, "step": 156500 }, { "epoch": 1.69, "learning_rate": 4.620548744892002e-05, "loss": 0.0065, "step": 156510 }, { "epoch": 1.69, "learning_rate": 4.6189271583317116e-05, "loss": 0.0084, "step": 156520 }, { "epoch": 1.69, "learning_rate": 4.617305571771421e-05, "loss": 0.0086, "step": 156530 }, { "epoch": 1.69, "learning_rate": 4.615683985211131e-05, "loss": 0.0078, "step": 156540 }, { "epoch": 1.69, "learning_rate": 4.61406239865084e-05, "loss": 0.0076, "step": 156550 }, { "epoch": 1.69, "learning_rate": 4.612440812090549e-05, "loss": 0.0065, "step": 156560 }, { "epoch": 1.69, "learning_rate": 4.6108192255302586e-05, "loss": 0.0066, "step": 156570 }, { "epoch": 1.69, "learning_rate": 4.609197638969968e-05, "loss": 0.0056, "step": 156580 }, { "epoch": 1.69, "learning_rate": 4.607576052409677e-05, "loss": 0.0089, "step": 156590 }, { "epoch": 1.69, "learning_rate": 4.605954465849387e-05, "loss": 0.0081, "step": 156600 }, { "epoch": 1.69, "learning_rate": 4.6043328792890964e-05, "loss": 0.0096, "step": 156610 }, { "epoch": 1.69, "learning_rate": 4.6027112927288057e-05, "loss": 0.009, "step": 156620 }, { "epoch": 1.69, "learning_rate": 4.601089706168515e-05, "loss": 0.0081, "step": 156630 }, { "epoch": 1.69, "learning_rate": 4.599468119608224e-05, "loss": 0.0057, "step": 156640 }, { "epoch": 1.69, "learning_rate": 4.597846533047934e-05, "loss": 0.0076, "step": 156650 }, { "epoch": 1.69, "learning_rate": 4.5962249464876434e-05, "loss": 0.0068, "step": 156660 }, { "epoch": 1.69, "learning_rate": 4.594603359927353e-05, "loss": 0.0061, "step": 156670 }, { "epoch": 1.69, "learning_rate": 4.592981773367062e-05, "loss": 0.0073, "step": 156680 }, { "epoch": 1.69, "learning_rate": 4.591360186806771e-05, "loss": 0.0118, "step": 156690 }, { "epoch": 1.69, "learning_rate": 4.589738600246481e-05, "loss": 0.0066, "step": 156700 }, { "epoch": 1.69, "learning_rate": 4.5881170136861905e-05, "loss": 0.0092, "step": 156710 }, { "epoch": 1.69, "learning_rate": 4.5864954271259e-05, "loss": 0.0075, "step": 156720 }, { "epoch": 1.69, "learning_rate": 4.584873840565609e-05, "loss": 0.0065, "step": 156730 }, { "epoch": 1.69, "learning_rate": 4.583252254005318e-05, "loss": 0.0058, "step": 156740 }, { "epoch": 1.69, "learning_rate": 4.5816306674450276e-05, "loss": 0.0065, "step": 156750 }, { "epoch": 1.69, "learning_rate": 4.5800090808847375e-05, "loss": 0.0076, "step": 156760 }, { "epoch": 1.69, "learning_rate": 4.578387494324447e-05, "loss": 0.0064, "step": 156770 }, { "epoch": 1.69, "learning_rate": 4.576765907764156e-05, "loss": 0.0081, "step": 156780 }, { "epoch": 1.69, "learning_rate": 4.5751443212038654e-05, "loss": 0.0058, "step": 156790 }, { "epoch": 1.7, "learning_rate": 4.5735227346435746e-05, "loss": 0.0068, "step": 156800 }, { "epoch": 1.7, "learning_rate": 4.5719011480832846e-05, "loss": 0.0062, "step": 156810 }, { "epoch": 1.7, "learning_rate": 4.570279561522994e-05, "loss": 0.0066, "step": 156820 }, { "epoch": 1.7, "learning_rate": 4.568657974962703e-05, "loss": 0.0061, "step": 156830 }, { "epoch": 1.7, "learning_rate": 4.5670363884024124e-05, "loss": 0.0054, "step": 156840 }, { "epoch": 1.7, "learning_rate": 4.565414801842122e-05, "loss": 0.0065, "step": 156850 }, { "epoch": 1.7, "learning_rate": 4.563793215281831e-05, "loss": 0.0066, "step": 156860 }, { "epoch": 1.7, "learning_rate": 4.562171628721541e-05, "loss": 0.0105, "step": 156870 }, { "epoch": 1.7, "learning_rate": 4.56055004216125e-05, "loss": 0.0081, "step": 156880 }, { "epoch": 1.7, "learning_rate": 4.5589284556009595e-05, "loss": 0.0071, "step": 156890 }, { "epoch": 1.7, "learning_rate": 4.557306869040669e-05, "loss": 0.007, "step": 156900 }, { "epoch": 1.7, "learning_rate": 4.555685282480378e-05, "loss": 0.0058, "step": 156910 }, { "epoch": 1.7, "learning_rate": 4.554063695920088e-05, "loss": 0.0073, "step": 156920 }, { "epoch": 1.7, "learning_rate": 4.552442109359797e-05, "loss": 0.0061, "step": 156930 }, { "epoch": 1.7, "learning_rate": 4.5508205227995065e-05, "loss": 0.0081, "step": 156940 }, { "epoch": 1.7, "learning_rate": 4.549198936239216e-05, "loss": 0.007, "step": 156950 }, { "epoch": 1.7, "learning_rate": 4.547577349678925e-05, "loss": 0.0063, "step": 156960 }, { "epoch": 1.7, "learning_rate": 4.545955763118635e-05, "loss": 0.0052, "step": 156970 }, { "epoch": 1.7, "learning_rate": 4.544334176558344e-05, "loss": 0.006, "step": 156980 }, { "epoch": 1.7, "learning_rate": 4.5427125899980536e-05, "loss": 0.0066, "step": 156990 }, { "epoch": 1.7, "learning_rate": 4.541091003437763e-05, "loss": 0.0058, "step": 157000 }, { "epoch": 1.7, "eval_cer": 0.9215112996558595, "eval_loss": 0.005920048803091049, "eval_runtime": 121.2838, "eval_samples_per_second": 16.49, "eval_steps_per_second": 4.123, "step": 157000 }, { "epoch": 1.7, "learning_rate": 4.539469416877472e-05, "loss": 0.0075, "step": 157010 }, { "epoch": 1.7, "learning_rate": 4.5378478303171814e-05, "loss": 0.0054, "step": 157020 }, { "epoch": 1.7, "learning_rate": 4.536226243756891e-05, "loss": 0.0072, "step": 157030 }, { "epoch": 1.7, "learning_rate": 4.5346046571966006e-05, "loss": 0.0065, "step": 157040 }, { "epoch": 1.7, "learning_rate": 4.53298307063631e-05, "loss": 0.0075, "step": 157050 }, { "epoch": 1.7, "learning_rate": 4.531361484076019e-05, "loss": 0.0052, "step": 157060 }, { "epoch": 1.7, "learning_rate": 4.5297398975157284e-05, "loss": 0.0071, "step": 157070 }, { "epoch": 1.7, "learning_rate": 4.5281183109554384e-05, "loss": 0.0064, "step": 157080 }, { "epoch": 1.7, "learning_rate": 4.5264967243951477e-05, "loss": 0.0077, "step": 157090 }, { "epoch": 1.7, "learning_rate": 4.524875137834857e-05, "loss": 0.0072, "step": 157100 }, { "epoch": 1.7, "learning_rate": 4.523253551274566e-05, "loss": 0.0054, "step": 157110 }, { "epoch": 1.7, "learning_rate": 4.5216319647142755e-05, "loss": 0.006, "step": 157120 }, { "epoch": 1.7, "learning_rate": 4.5200103781539854e-05, "loss": 0.0071, "step": 157130 }, { "epoch": 1.7, "learning_rate": 4.518388791593695e-05, "loss": 0.0069, "step": 157140 }, { "epoch": 1.7, "learning_rate": 4.516767205033404e-05, "loss": 0.009, "step": 157150 }, { "epoch": 1.7, "learning_rate": 4.515145618473113e-05, "loss": 0.0073, "step": 157160 }, { "epoch": 1.7, "learning_rate": 4.513524031912823e-05, "loss": 0.0065, "step": 157170 }, { "epoch": 1.7, "learning_rate": 4.511902445352533e-05, "loss": 0.0072, "step": 157180 }, { "epoch": 1.7, "learning_rate": 4.5102808587922424e-05, "loss": 0.0066, "step": 157190 }, { "epoch": 1.7, "learning_rate": 4.508659272231952e-05, "loss": 0.0082, "step": 157200 }, { "epoch": 1.7, "learning_rate": 4.507037685671661e-05, "loss": 0.008, "step": 157210 }, { "epoch": 1.7, "learning_rate": 4.50541609911137e-05, "loss": 0.0072, "step": 157220 }, { "epoch": 1.7, "learning_rate": 4.50379451255108e-05, "loss": 0.0059, "step": 157230 }, { "epoch": 1.7, "learning_rate": 4.5021729259907895e-05, "loss": 0.0082, "step": 157240 }, { "epoch": 1.7, "learning_rate": 4.500551339430499e-05, "loss": 0.0083, "step": 157250 }, { "epoch": 1.7, "learning_rate": 4.498929752870208e-05, "loss": 0.0077, "step": 157260 }, { "epoch": 1.7, "learning_rate": 4.497308166309917e-05, "loss": 0.0071, "step": 157270 }, { "epoch": 1.7, "learning_rate": 4.495686579749627e-05, "loss": 0.0086, "step": 157280 }, { "epoch": 1.7, "learning_rate": 4.4940649931893365e-05, "loss": 0.007, "step": 157290 }, { "epoch": 1.7, "learning_rate": 4.492443406629046e-05, "loss": 0.007, "step": 157300 }, { "epoch": 1.7, "learning_rate": 4.490821820068755e-05, "loss": 0.0075, "step": 157310 }, { "epoch": 1.7, "learning_rate": 4.4892002335084643e-05, "loss": 0.0067, "step": 157320 }, { "epoch": 1.7, "learning_rate": 4.4875786469481736e-05, "loss": 0.0084, "step": 157330 }, { "epoch": 1.7, "learning_rate": 4.4859570603878836e-05, "loss": 0.0088, "step": 157340 }, { "epoch": 1.7, "learning_rate": 4.484335473827593e-05, "loss": 0.0067, "step": 157350 }, { "epoch": 1.7, "learning_rate": 4.482713887267302e-05, "loss": 0.0077, "step": 157360 }, { "epoch": 1.7, "learning_rate": 4.4810923007070114e-05, "loss": 0.0077, "step": 157370 }, { "epoch": 1.7, "learning_rate": 4.479470714146721e-05, "loss": 0.0101, "step": 157380 }, { "epoch": 1.7, "learning_rate": 4.4778491275864306e-05, "loss": 0.0064, "step": 157390 }, { "epoch": 1.7, "learning_rate": 4.47622754102614e-05, "loss": 0.0061, "step": 157400 }, { "epoch": 1.7, "learning_rate": 4.474605954465849e-05, "loss": 0.0067, "step": 157410 }, { "epoch": 1.7, "learning_rate": 4.4729843679055584e-05, "loss": 0.0103, "step": 157420 }, { "epoch": 1.7, "learning_rate": 4.471362781345268e-05, "loss": 0.0052, "step": 157430 }, { "epoch": 1.7, "learning_rate": 4.469741194784977e-05, "loss": 0.0071, "step": 157440 }, { "epoch": 1.7, "learning_rate": 4.468119608224687e-05, "loss": 0.0077, "step": 157450 }, { "epoch": 1.7, "learning_rate": 4.466498021664396e-05, "loss": 0.0066, "step": 157460 }, { "epoch": 1.7, "learning_rate": 4.4648764351041055e-05, "loss": 0.0061, "step": 157470 }, { "epoch": 1.7, "learning_rate": 4.463254848543815e-05, "loss": 0.005, "step": 157480 }, { "epoch": 1.7, "learning_rate": 4.461633261983524e-05, "loss": 0.0078, "step": 157490 }, { "epoch": 1.7, "learning_rate": 4.460011675423234e-05, "loss": 0.0063, "step": 157500 }, { "epoch": 1.7, "learning_rate": 4.458390088862943e-05, "loss": 0.0062, "step": 157510 }, { "epoch": 1.7, "learning_rate": 4.4567685023026525e-05, "loss": 0.0074, "step": 157520 }, { "epoch": 1.7, "learning_rate": 4.455146915742362e-05, "loss": 0.007, "step": 157530 }, { "epoch": 1.7, "learning_rate": 4.453525329182071e-05, "loss": 0.0082, "step": 157540 }, { "epoch": 1.7, "learning_rate": 4.451903742621781e-05, "loss": 0.0079, "step": 157550 }, { "epoch": 1.7, "learning_rate": 4.45028215606149e-05, "loss": 0.0046, "step": 157560 }, { "epoch": 1.7, "learning_rate": 4.4486605695011996e-05, "loss": 0.0089, "step": 157570 }, { "epoch": 1.7, "learning_rate": 4.447038982940909e-05, "loss": 0.0074, "step": 157580 }, { "epoch": 1.7, "learning_rate": 4.445417396380618e-05, "loss": 0.0082, "step": 157590 }, { "epoch": 1.7, "learning_rate": 4.4437958098203274e-05, "loss": 0.0069, "step": 157600 }, { "epoch": 1.7, "learning_rate": 4.4421742232600374e-05, "loss": 0.0065, "step": 157610 }, { "epoch": 1.7, "learning_rate": 4.4405526366997466e-05, "loss": 0.0068, "step": 157620 }, { "epoch": 1.7, "learning_rate": 4.438931050139456e-05, "loss": 0.0081, "step": 157630 }, { "epoch": 1.7, "learning_rate": 4.437309463579165e-05, "loss": 0.0074, "step": 157640 }, { "epoch": 1.7, "learning_rate": 4.4356878770188745e-05, "loss": 0.009, "step": 157650 }, { "epoch": 1.7, "learning_rate": 4.4340662904585844e-05, "loss": 0.0053, "step": 157660 }, { "epoch": 1.7, "learning_rate": 4.432444703898294e-05, "loss": 0.006, "step": 157670 }, { "epoch": 1.7, "learning_rate": 4.430823117338003e-05, "loss": 0.0059, "step": 157680 }, { "epoch": 1.7, "learning_rate": 4.429201530777712e-05, "loss": 0.0075, "step": 157690 }, { "epoch": 1.7, "learning_rate": 4.4275799442174215e-05, "loss": 0.007, "step": 157700 }, { "epoch": 1.7, "learning_rate": 4.4259583576571315e-05, "loss": 0.0052, "step": 157710 }, { "epoch": 1.71, "learning_rate": 4.424336771096841e-05, "loss": 0.0053, "step": 157720 }, { "epoch": 1.71, "learning_rate": 4.42271518453655e-05, "loss": 0.0053, "step": 157730 }, { "epoch": 1.71, "learning_rate": 4.421093597976259e-05, "loss": 0.0056, "step": 157740 }, { "epoch": 1.71, "learning_rate": 4.4194720114159686e-05, "loss": 0.0057, "step": 157750 }, { "epoch": 1.71, "learning_rate": 4.417850424855678e-05, "loss": 0.0051, "step": 157760 }, { "epoch": 1.71, "learning_rate": 4.416228838295388e-05, "loss": 0.007, "step": 157770 }, { "epoch": 1.71, "learning_rate": 4.414607251735097e-05, "loss": 0.0081, "step": 157780 }, { "epoch": 1.71, "learning_rate": 4.4129856651748063e-05, "loss": 0.0074, "step": 157790 }, { "epoch": 1.71, "learning_rate": 4.4113640786145156e-05, "loss": 0.005, "step": 157800 }, { "epoch": 1.71, "learning_rate": 4.409742492054225e-05, "loss": 0.0057, "step": 157810 }, { "epoch": 1.71, "learning_rate": 4.408120905493935e-05, "loss": 0.0063, "step": 157820 }, { "epoch": 1.71, "learning_rate": 4.406499318933644e-05, "loss": 0.0057, "step": 157830 }, { "epoch": 1.71, "learning_rate": 4.4048777323733534e-05, "loss": 0.0068, "step": 157840 }, { "epoch": 1.71, "learning_rate": 4.403256145813063e-05, "loss": 0.0048, "step": 157850 }, { "epoch": 1.71, "learning_rate": 4.401634559252772e-05, "loss": 0.0066, "step": 157860 }, { "epoch": 1.71, "learning_rate": 4.400012972692481e-05, "loss": 0.0105, "step": 157870 }, { "epoch": 1.71, "learning_rate": 4.398391386132191e-05, "loss": 0.0063, "step": 157880 }, { "epoch": 1.71, "learning_rate": 4.396769799571901e-05, "loss": 0.0086, "step": 157890 }, { "epoch": 1.71, "learning_rate": 4.3951482130116104e-05, "loss": 0.006, "step": 157900 }, { "epoch": 1.71, "learning_rate": 4.39352662645132e-05, "loss": 0.0076, "step": 157910 }, { "epoch": 1.71, "learning_rate": 4.3919050398910296e-05, "loss": 0.0075, "step": 157920 }, { "epoch": 1.71, "learning_rate": 4.390283453330739e-05, "loss": 0.0112, "step": 157930 }, { "epoch": 1.71, "learning_rate": 4.388661866770448e-05, "loss": 0.0079, "step": 157940 }, { "epoch": 1.71, "learning_rate": 4.3870402802101574e-05, "loss": 0.0072, "step": 157950 }, { "epoch": 1.71, "learning_rate": 4.385418693649867e-05, "loss": 0.0058, "step": 157960 }, { "epoch": 1.71, "learning_rate": 4.383797107089577e-05, "loss": 0.0061, "step": 157970 }, { "epoch": 1.71, "learning_rate": 4.382175520529286e-05, "loss": 0.0082, "step": 157980 }, { "epoch": 1.71, "learning_rate": 4.380553933968995e-05, "loss": 0.0057, "step": 157990 }, { "epoch": 1.71, "learning_rate": 4.3789323474087045e-05, "loss": 0.0093, "step": 158000 }, { "epoch": 1.71, "eval_cer": 0.921521722891336, "eval_loss": 0.005824473220854998, "eval_runtime": 121.2769, "eval_samples_per_second": 16.491, "eval_steps_per_second": 4.123, "step": 158000 }, { "epoch": 1.71, "learning_rate": 4.377310760848414e-05, "loss": 0.0074, "step": 158010 }, { "epoch": 1.71, "learning_rate": 4.375689174288123e-05, "loss": 0.0083, "step": 158020 }, { "epoch": 1.71, "learning_rate": 4.374067587727833e-05, "loss": 0.0082, "step": 158030 }, { "epoch": 1.71, "learning_rate": 4.372446001167542e-05, "loss": 0.0069, "step": 158040 }, { "epoch": 1.71, "learning_rate": 4.3708244146072515e-05, "loss": 0.0076, "step": 158050 }, { "epoch": 1.71, "learning_rate": 4.369202828046961e-05, "loss": 0.0062, "step": 158060 }, { "epoch": 1.71, "learning_rate": 4.36758124148667e-05, "loss": 0.0085, "step": 158070 }, { "epoch": 1.71, "learning_rate": 4.36595965492638e-05, "loss": 0.0069, "step": 158080 }, { "epoch": 1.71, "learning_rate": 4.364338068366089e-05, "loss": 0.0071, "step": 158090 }, { "epoch": 1.71, "learning_rate": 4.3627164818057986e-05, "loss": 0.0069, "step": 158100 }, { "epoch": 1.71, "learning_rate": 4.361094895245508e-05, "loss": 0.0075, "step": 158110 }, { "epoch": 1.71, "learning_rate": 4.359473308685217e-05, "loss": 0.0068, "step": 158120 }, { "epoch": 1.71, "learning_rate": 4.357851722124927e-05, "loss": 0.0088, "step": 158130 }, { "epoch": 1.71, "learning_rate": 4.3562301355646364e-05, "loss": 0.0057, "step": 158140 }, { "epoch": 1.71, "learning_rate": 4.3546085490043456e-05, "loss": 0.0055, "step": 158150 }, { "epoch": 1.71, "learning_rate": 4.352986962444055e-05, "loss": 0.0072, "step": 158160 }, { "epoch": 1.71, "learning_rate": 4.351365375883764e-05, "loss": 0.007, "step": 158170 }, { "epoch": 1.71, "learning_rate": 4.3497437893234735e-05, "loss": 0.0062, "step": 158180 }, { "epoch": 1.71, "learning_rate": 4.3481222027631834e-05, "loss": 0.0069, "step": 158190 }, { "epoch": 1.71, "learning_rate": 4.346500616202893e-05, "loss": 0.0076, "step": 158200 }, { "epoch": 1.71, "learning_rate": 4.344879029642602e-05, "loss": 0.0063, "step": 158210 }, { "epoch": 1.71, "learning_rate": 4.343257443082311e-05, "loss": 0.0061, "step": 158220 }, { "epoch": 1.71, "learning_rate": 4.3416358565220205e-05, "loss": 0.0093, "step": 158230 }, { "epoch": 1.71, "learning_rate": 4.3400142699617305e-05, "loss": 0.0066, "step": 158240 }, { "epoch": 1.71, "learning_rate": 4.33839268340144e-05, "loss": 0.0061, "step": 158250 }, { "epoch": 1.71, "learning_rate": 4.336771096841149e-05, "loss": 0.0061, "step": 158260 }, { "epoch": 1.71, "learning_rate": 4.335149510280858e-05, "loss": 0.0086, "step": 158270 }, { "epoch": 1.71, "learning_rate": 4.3335279237205676e-05, "loss": 0.0064, "step": 158280 }, { "epoch": 1.71, "learning_rate": 4.3319063371602775e-05, "loss": 0.0082, "step": 158290 }, { "epoch": 1.71, "learning_rate": 4.330284750599987e-05, "loss": 0.0092, "step": 158300 }, { "epoch": 1.71, "learning_rate": 4.328663164039696e-05, "loss": 0.007, "step": 158310 }, { "epoch": 1.71, "learning_rate": 4.327041577479405e-05, "loss": 0.0085, "step": 158320 }, { "epoch": 1.71, "learning_rate": 4.3254199909191146e-05, "loss": 0.0068, "step": 158330 }, { "epoch": 1.71, "learning_rate": 4.323798404358824e-05, "loss": 0.007, "step": 158340 }, { "epoch": 1.71, "learning_rate": 4.322176817798534e-05, "loss": 0.0054, "step": 158350 }, { "epoch": 1.71, "learning_rate": 4.320555231238243e-05, "loss": 0.0058, "step": 158360 }, { "epoch": 1.71, "learning_rate": 4.3189336446779524e-05, "loss": 0.0059, "step": 158370 }, { "epoch": 1.71, "learning_rate": 4.3173120581176617e-05, "loss": 0.0065, "step": 158380 }, { "epoch": 1.71, "learning_rate": 4.315690471557371e-05, "loss": 0.0082, "step": 158390 }, { "epoch": 1.71, "learning_rate": 4.314068884997081e-05, "loss": 0.0064, "step": 158400 }, { "epoch": 1.71, "learning_rate": 4.31244729843679e-05, "loss": 0.0067, "step": 158410 }, { "epoch": 1.71, "learning_rate": 4.3108257118764994e-05, "loss": 0.0067, "step": 158420 }, { "epoch": 1.71, "learning_rate": 4.309204125316209e-05, "loss": 0.0054, "step": 158430 }, { "epoch": 1.71, "learning_rate": 4.307582538755918e-05, "loss": 0.0073, "step": 158440 }, { "epoch": 1.71, "learning_rate": 4.305960952195627e-05, "loss": 0.0076, "step": 158450 }, { "epoch": 1.71, "learning_rate": 4.304339365635337e-05, "loss": 0.0057, "step": 158460 }, { "epoch": 1.71, "learning_rate": 4.3027177790750465e-05, "loss": 0.0076, "step": 158470 }, { "epoch": 1.71, "learning_rate": 4.301096192514756e-05, "loss": 0.0077, "step": 158480 }, { "epoch": 1.71, "learning_rate": 4.299474605954465e-05, "loss": 0.0063, "step": 158490 }, { "epoch": 1.71, "learning_rate": 4.297853019394174e-05, "loss": 0.0097, "step": 158500 }, { "epoch": 1.71, "learning_rate": 4.296231432833884e-05, "loss": 0.0067, "step": 158510 }, { "epoch": 1.71, "learning_rate": 4.2946098462735935e-05, "loss": 0.0058, "step": 158520 }, { "epoch": 1.71, "learning_rate": 4.292988259713303e-05, "loss": 0.0062, "step": 158530 }, { "epoch": 1.71, "learning_rate": 4.291366673153012e-05, "loss": 0.0073, "step": 158540 }, { "epoch": 1.71, "learning_rate": 4.2897450865927214e-05, "loss": 0.0084, "step": 158550 }, { "epoch": 1.71, "learning_rate": 4.288123500032431e-05, "loss": 0.0059, "step": 158560 }, { "epoch": 1.71, "learning_rate": 4.2865019134721406e-05, "loss": 0.0067, "step": 158570 }, { "epoch": 1.71, "learning_rate": 4.28488032691185e-05, "loss": 0.0055, "step": 158580 }, { "epoch": 1.71, "learning_rate": 4.283258740351559e-05, "loss": 0.0069, "step": 158590 }, { "epoch": 1.71, "learning_rate": 4.2816371537912684e-05, "loss": 0.0071, "step": 158600 }, { "epoch": 1.71, "learning_rate": 4.280015567230979e-05, "loss": 0.0063, "step": 158610 }, { "epoch": 1.71, "learning_rate": 4.278393980670688e-05, "loss": 0.0083, "step": 158620 }, { "epoch": 1.71, "learning_rate": 4.2767723941103976e-05, "loss": 0.0071, "step": 158630 }, { "epoch": 1.71, "learning_rate": 4.275150807550107e-05, "loss": 0.0072, "step": 158640 }, { "epoch": 1.72, "learning_rate": 4.273529220989816e-05, "loss": 0.0064, "step": 158650 }, { "epoch": 1.72, "learning_rate": 4.271907634429526e-05, "loss": 0.0069, "step": 158660 }, { "epoch": 1.72, "learning_rate": 4.2702860478692354e-05, "loss": 0.0052, "step": 158670 }, { "epoch": 1.72, "learning_rate": 4.2686644613089446e-05, "loss": 0.0056, "step": 158680 }, { "epoch": 1.72, "learning_rate": 4.267042874748654e-05, "loss": 0.0065, "step": 158690 }, { "epoch": 1.72, "learning_rate": 4.265421288188363e-05, "loss": 0.0062, "step": 158700 }, { "epoch": 1.72, "learning_rate": 4.263799701628073e-05, "loss": 0.0074, "step": 158710 }, { "epoch": 1.72, "learning_rate": 4.2621781150677824e-05, "loss": 0.0068, "step": 158720 }, { "epoch": 1.72, "learning_rate": 4.260556528507492e-05, "loss": 0.0056, "step": 158730 }, { "epoch": 1.72, "learning_rate": 4.258934941947201e-05, "loss": 0.0073, "step": 158740 }, { "epoch": 1.72, "learning_rate": 4.25731335538691e-05, "loss": 0.0059, "step": 158750 }, { "epoch": 1.72, "learning_rate": 4.2556917688266195e-05, "loss": 0.0056, "step": 158760 }, { "epoch": 1.72, "learning_rate": 4.2540701822663295e-05, "loss": 0.0059, "step": 158770 }, { "epoch": 1.72, "learning_rate": 4.252448595706039e-05, "loss": 0.0101, "step": 158780 }, { "epoch": 1.72, "learning_rate": 4.250827009145748e-05, "loss": 0.0065, "step": 158790 }, { "epoch": 1.72, "learning_rate": 4.249205422585457e-05, "loss": 0.0073, "step": 158800 }, { "epoch": 1.72, "learning_rate": 4.2475838360251666e-05, "loss": 0.0089, "step": 158810 }, { "epoch": 1.72, "learning_rate": 4.2459622494648765e-05, "loss": 0.0095, "step": 158820 }, { "epoch": 1.72, "learning_rate": 4.244340662904586e-05, "loss": 0.0072, "step": 158830 }, { "epoch": 1.72, "learning_rate": 4.242719076344295e-05, "loss": 0.0074, "step": 158840 }, { "epoch": 1.72, "learning_rate": 4.241097489784004e-05, "loss": 0.0058, "step": 158850 }, { "epoch": 1.72, "learning_rate": 4.2394759032237136e-05, "loss": 0.0069, "step": 158860 }, { "epoch": 1.72, "learning_rate": 4.2378543166634236e-05, "loss": 0.0061, "step": 158870 }, { "epoch": 1.72, "learning_rate": 4.236232730103133e-05, "loss": 0.0085, "step": 158880 }, { "epoch": 1.72, "learning_rate": 4.234611143542842e-05, "loss": 0.007, "step": 158890 }, { "epoch": 1.72, "learning_rate": 4.2329895569825514e-05, "loss": 0.0059, "step": 158900 }, { "epoch": 1.72, "learning_rate": 4.2313679704222607e-05, "loss": 0.0057, "step": 158910 }, { "epoch": 1.72, "learning_rate": 4.22974638386197e-05, "loss": 0.0067, "step": 158920 }, { "epoch": 1.72, "learning_rate": 4.22812479730168e-05, "loss": 0.0086, "step": 158930 }, { "epoch": 1.72, "learning_rate": 4.226503210741389e-05, "loss": 0.0078, "step": 158940 }, { "epoch": 1.72, "learning_rate": 4.2248816241810984e-05, "loss": 0.0063, "step": 158950 }, { "epoch": 1.72, "learning_rate": 4.223260037620808e-05, "loss": 0.0058, "step": 158960 }, { "epoch": 1.72, "learning_rate": 4.221638451060517e-05, "loss": 0.0098, "step": 158970 }, { "epoch": 1.72, "learning_rate": 4.220016864500227e-05, "loss": 0.0069, "step": 158980 }, { "epoch": 1.72, "learning_rate": 4.218395277939936e-05, "loss": 0.0065, "step": 158990 }, { "epoch": 1.72, "learning_rate": 4.2167736913796455e-05, "loss": 0.0079, "step": 159000 }, { "epoch": 1.72, "eval_cer": 0.9215208542883797, "eval_loss": 0.005773806478828192, "eval_runtime": 121.1921, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 159000 }, { "epoch": 1.72, "learning_rate": 4.215152104819355e-05, "loss": 0.0073, "step": 159010 }, { "epoch": 1.72, "learning_rate": 4.213530518259064e-05, "loss": 0.0069, "step": 159020 }, { "epoch": 1.72, "learning_rate": 4.211908931698773e-05, "loss": 0.0086, "step": 159030 }, { "epoch": 1.72, "learning_rate": 4.210287345138483e-05, "loss": 0.0064, "step": 159040 }, { "epoch": 1.72, "learning_rate": 4.2086657585781925e-05, "loss": 0.0082, "step": 159050 }, { "epoch": 1.72, "learning_rate": 4.207044172017902e-05, "loss": 0.0056, "step": 159060 }, { "epoch": 1.72, "learning_rate": 4.205422585457611e-05, "loss": 0.0066, "step": 159070 }, { "epoch": 1.72, "learning_rate": 4.2038009988973204e-05, "loss": 0.0059, "step": 159080 }, { "epoch": 1.72, "learning_rate": 4.20217941233703e-05, "loss": 0.0072, "step": 159090 }, { "epoch": 1.72, "learning_rate": 4.2005578257767396e-05, "loss": 0.0059, "step": 159100 }, { "epoch": 1.72, "learning_rate": 4.198936239216449e-05, "loss": 0.008, "step": 159110 }, { "epoch": 1.72, "learning_rate": 4.197314652656158e-05, "loss": 0.008, "step": 159120 }, { "epoch": 1.72, "learning_rate": 4.1956930660958674e-05, "loss": 0.007, "step": 159130 }, { "epoch": 1.72, "learning_rate": 4.1940714795355774e-05, "loss": 0.0092, "step": 159140 }, { "epoch": 1.72, "learning_rate": 4.1924498929752866e-05, "loss": 0.0096, "step": 159150 }, { "epoch": 1.72, "learning_rate": 4.190828306414996e-05, "loss": 0.0055, "step": 159160 }, { "epoch": 1.72, "learning_rate": 4.189206719854705e-05, "loss": 0.0068, "step": 159170 }, { "epoch": 1.72, "learning_rate": 4.1875851332944144e-05, "loss": 0.0059, "step": 159180 }, { "epoch": 1.72, "learning_rate": 4.185963546734124e-05, "loss": 0.0066, "step": 159190 }, { "epoch": 1.72, "learning_rate": 4.184341960173834e-05, "loss": 0.0067, "step": 159200 }, { "epoch": 1.72, "learning_rate": 4.182720373613543e-05, "loss": 0.0088, "step": 159210 }, { "epoch": 1.72, "learning_rate": 4.181098787053252e-05, "loss": 0.0074, "step": 159220 }, { "epoch": 1.72, "learning_rate": 4.1794772004929615e-05, "loss": 0.0064, "step": 159230 }, { "epoch": 1.72, "learning_rate": 4.177855613932671e-05, "loss": 0.0077, "step": 159240 }, { "epoch": 1.72, "learning_rate": 4.176234027372381e-05, "loss": 0.0063, "step": 159250 }, { "epoch": 1.72, "learning_rate": 4.17461244081209e-05, "loss": 0.007, "step": 159260 }, { "epoch": 1.72, "learning_rate": 4.172990854251799e-05, "loss": 0.0087, "step": 159270 }, { "epoch": 1.72, "learning_rate": 4.1713692676915085e-05, "loss": 0.006, "step": 159280 }, { "epoch": 1.72, "learning_rate": 4.169747681131218e-05, "loss": 0.0069, "step": 159290 }, { "epoch": 1.72, "learning_rate": 4.168126094570928e-05, "loss": 0.0056, "step": 159300 }, { "epoch": 1.72, "learning_rate": 4.166504508010637e-05, "loss": 0.0064, "step": 159310 }, { "epoch": 1.72, "learning_rate": 4.164882921450346e-05, "loss": 0.0074, "step": 159320 }, { "epoch": 1.72, "learning_rate": 4.163261334890056e-05, "loss": 0.0057, "step": 159330 }, { "epoch": 1.72, "learning_rate": 4.1616397483297655e-05, "loss": 0.0071, "step": 159340 }, { "epoch": 1.72, "learning_rate": 4.1600181617694755e-05, "loss": 0.0067, "step": 159350 }, { "epoch": 1.72, "learning_rate": 4.158396575209185e-05, "loss": 0.0093, "step": 159360 }, { "epoch": 1.72, "learning_rate": 4.156774988648894e-05, "loss": 0.0083, "step": 159370 }, { "epoch": 1.72, "learning_rate": 4.155153402088603e-05, "loss": 0.0067, "step": 159380 }, { "epoch": 1.72, "learning_rate": 4.1535318155283126e-05, "loss": 0.007, "step": 159390 }, { "epoch": 1.72, "learning_rate": 4.1519102289680226e-05, "loss": 0.009, "step": 159400 }, { "epoch": 1.72, "learning_rate": 4.150288642407732e-05, "loss": 0.0057, "step": 159410 }, { "epoch": 1.72, "learning_rate": 4.148667055847441e-05, "loss": 0.007, "step": 159420 }, { "epoch": 1.72, "learning_rate": 4.1470454692871504e-05, "loss": 0.007, "step": 159430 }, { "epoch": 1.72, "learning_rate": 4.1454238827268596e-05, "loss": 0.0108, "step": 159440 }, { "epoch": 1.72, "learning_rate": 4.1438022961665696e-05, "loss": 0.0054, "step": 159450 }, { "epoch": 1.72, "learning_rate": 4.142180709606279e-05, "loss": 0.005, "step": 159460 }, { "epoch": 1.72, "learning_rate": 4.140559123045988e-05, "loss": 0.0082, "step": 159470 }, { "epoch": 1.72, "learning_rate": 4.1389375364856974e-05, "loss": 0.0066, "step": 159480 }, { "epoch": 1.72, "learning_rate": 4.137315949925407e-05, "loss": 0.0064, "step": 159490 }, { "epoch": 1.72, "learning_rate": 4.135694363365116e-05, "loss": 0.0051, "step": 159500 }, { "epoch": 1.72, "learning_rate": 4.134072776804826e-05, "loss": 0.0056, "step": 159510 }, { "epoch": 1.72, "learning_rate": 4.132451190244535e-05, "loss": 0.0108, "step": 159520 }, { "epoch": 1.72, "learning_rate": 4.1308296036842445e-05, "loss": 0.006, "step": 159530 }, { "epoch": 1.72, "learning_rate": 4.129208017123954e-05, "loss": 0.007, "step": 159540 }, { "epoch": 1.72, "learning_rate": 4.127586430563663e-05, "loss": 0.0057, "step": 159550 }, { "epoch": 1.72, "learning_rate": 4.125964844003373e-05, "loss": 0.0073, "step": 159560 }, { "epoch": 1.73, "learning_rate": 4.124343257443082e-05, "loss": 0.0062, "step": 159570 }, { "epoch": 1.73, "learning_rate": 4.1227216708827915e-05, "loss": 0.0072, "step": 159580 }, { "epoch": 1.73, "learning_rate": 4.121100084322501e-05, "loss": 0.0086, "step": 159590 }, { "epoch": 1.73, "learning_rate": 4.11947849776221e-05, "loss": 0.0056, "step": 159600 }, { "epoch": 1.73, "learning_rate": 4.11785691120192e-05, "loss": 0.0054, "step": 159610 }, { "epoch": 1.73, "learning_rate": 4.116235324641629e-05, "loss": 0.008, "step": 159620 }, { "epoch": 1.73, "learning_rate": 4.1146137380813386e-05, "loss": 0.0067, "step": 159630 }, { "epoch": 1.73, "learning_rate": 4.112992151521048e-05, "loss": 0.0059, "step": 159640 }, { "epoch": 1.73, "learning_rate": 4.111370564960757e-05, "loss": 0.0048, "step": 159650 }, { "epoch": 1.73, "learning_rate": 4.1097489784004664e-05, "loss": 0.0068, "step": 159660 }, { "epoch": 1.73, "learning_rate": 4.1081273918401763e-05, "loss": 0.0073, "step": 159670 }, { "epoch": 1.73, "learning_rate": 4.1065058052798856e-05, "loss": 0.0075, "step": 159680 }, { "epoch": 1.73, "learning_rate": 4.104884218719595e-05, "loss": 0.0077, "step": 159690 }, { "epoch": 1.73, "learning_rate": 4.103262632159304e-05, "loss": 0.0065, "step": 159700 }, { "epoch": 1.73, "learning_rate": 4.1016410455990134e-05, "loss": 0.0091, "step": 159710 }, { "epoch": 1.73, "learning_rate": 4.1000194590387234e-05, "loss": 0.0066, "step": 159720 }, { "epoch": 1.73, "learning_rate": 4.098397872478433e-05, "loss": 0.0114, "step": 159730 }, { "epoch": 1.73, "learning_rate": 4.096776285918142e-05, "loss": 0.009, "step": 159740 }, { "epoch": 1.73, "learning_rate": 4.095154699357851e-05, "loss": 0.0074, "step": 159750 }, { "epoch": 1.73, "learning_rate": 4.0935331127975605e-05, "loss": 0.0062, "step": 159760 }, { "epoch": 1.73, "learning_rate": 4.09191152623727e-05, "loss": 0.0056, "step": 159770 }, { "epoch": 1.73, "learning_rate": 4.09028993967698e-05, "loss": 0.0054, "step": 159780 }, { "epoch": 1.73, "learning_rate": 4.088668353116689e-05, "loss": 0.0058, "step": 159790 }, { "epoch": 1.73, "learning_rate": 4.087046766556398e-05, "loss": 0.0059, "step": 159800 }, { "epoch": 1.73, "learning_rate": 4.0854251799961075e-05, "loss": 0.0052, "step": 159810 }, { "epoch": 1.73, "learning_rate": 4.083803593435817e-05, "loss": 0.005, "step": 159820 }, { "epoch": 1.73, "learning_rate": 4.082182006875527e-05, "loss": 0.0081, "step": 159830 }, { "epoch": 1.73, "learning_rate": 4.080560420315236e-05, "loss": 0.0101, "step": 159840 }, { "epoch": 1.73, "learning_rate": 4.078938833754945e-05, "loss": 0.0063, "step": 159850 }, { "epoch": 1.73, "learning_rate": 4.0773172471946546e-05, "loss": 0.0063, "step": 159860 }, { "epoch": 1.73, "learning_rate": 4.075695660634364e-05, "loss": 0.0076, "step": 159870 }, { "epoch": 1.73, "learning_rate": 4.074074074074074e-05, "loss": 0.0071, "step": 159880 }, { "epoch": 1.73, "learning_rate": 4.072452487513783e-05, "loss": 0.0084, "step": 159890 }, { "epoch": 1.73, "learning_rate": 4.0708309009534924e-05, "loss": 0.0064, "step": 159900 }, { "epoch": 1.73, "learning_rate": 4.0692093143932016e-05, "loss": 0.0068, "step": 159910 }, { "epoch": 1.73, "learning_rate": 4.067587727832911e-05, "loss": 0.0076, "step": 159920 }, { "epoch": 1.73, "learning_rate": 4.06596614127262e-05, "loss": 0.0059, "step": 159930 }, { "epoch": 1.73, "learning_rate": 4.06434455471233e-05, "loss": 0.0064, "step": 159940 }, { "epoch": 1.73, "learning_rate": 4.0627229681520394e-05, "loss": 0.0089, "step": 159950 }, { "epoch": 1.73, "learning_rate": 4.061101381591749e-05, "loss": 0.0062, "step": 159960 }, { "epoch": 1.73, "learning_rate": 4.059479795031458e-05, "loss": 0.0081, "step": 159970 }, { "epoch": 1.73, "learning_rate": 4.057858208471167e-05, "loss": 0.0089, "step": 159980 }, { "epoch": 1.73, "learning_rate": 4.056236621910877e-05, "loss": 0.0062, "step": 159990 }, { "epoch": 1.73, "learning_rate": 4.0546150353505865e-05, "loss": 0.0063, "step": 160000 }, { "epoch": 1.73, "eval_cer": 0.9215156426706413, "eval_loss": 0.005892171058803797, "eval_runtime": 121.1891, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 160000 }, { "epoch": 1.73, "learning_rate": 4.052993448790296e-05, "loss": 0.0083, "step": 160010 }, { "epoch": 1.73, "learning_rate": 4.051371862230005e-05, "loss": 0.0068, "step": 160020 }, { "epoch": 1.73, "learning_rate": 4.049750275669714e-05, "loss": 0.0069, "step": 160030 }, { "epoch": 1.73, "learning_rate": 4.0481286891094236e-05, "loss": 0.0071, "step": 160040 }, { "epoch": 1.73, "learning_rate": 4.046507102549134e-05, "loss": 0.0074, "step": 160050 }, { "epoch": 1.73, "learning_rate": 4.0448855159888435e-05, "loss": 0.0065, "step": 160060 }, { "epoch": 1.73, "learning_rate": 4.043263929428553e-05, "loss": 0.0087, "step": 160070 }, { "epoch": 1.73, "learning_rate": 4.041642342868262e-05, "loss": 0.0112, "step": 160080 }, { "epoch": 1.73, "learning_rate": 4.040020756307972e-05, "loss": 0.0078, "step": 160090 }, { "epoch": 1.73, "learning_rate": 4.038399169747681e-05, "loss": 0.0076, "step": 160100 }, { "epoch": 1.73, "learning_rate": 4.0367775831873905e-05, "loss": 0.0074, "step": 160110 }, { "epoch": 1.73, "learning_rate": 4.0351559966271e-05, "loss": 0.0061, "step": 160120 }, { "epoch": 1.73, "learning_rate": 4.033534410066809e-05, "loss": 0.0061, "step": 160130 }, { "epoch": 1.73, "learning_rate": 4.031912823506519e-05, "loss": 0.0053, "step": 160140 }, { "epoch": 1.73, "learning_rate": 4.030291236946228e-05, "loss": 0.0093, "step": 160150 }, { "epoch": 1.73, "learning_rate": 4.0286696503859376e-05, "loss": 0.0088, "step": 160160 }, { "epoch": 1.73, "learning_rate": 4.027048063825647e-05, "loss": 0.0068, "step": 160170 }, { "epoch": 1.73, "learning_rate": 4.025426477265356e-05, "loss": 0.0071, "step": 160180 }, { "epoch": 1.73, "learning_rate": 4.023804890705066e-05, "loss": 0.0074, "step": 160190 }, { "epoch": 1.73, "learning_rate": 4.0221833041447753e-05, "loss": 0.0055, "step": 160200 }, { "epoch": 1.73, "learning_rate": 4.0205617175844846e-05, "loss": 0.0058, "step": 160210 }, { "epoch": 1.73, "learning_rate": 4.018940131024194e-05, "loss": 0.0058, "step": 160220 }, { "epoch": 1.73, "learning_rate": 4.017318544463903e-05, "loss": 0.0065, "step": 160230 }, { "epoch": 1.73, "learning_rate": 4.0156969579036124e-05, "loss": 0.0057, "step": 160240 }, { "epoch": 1.73, "learning_rate": 4.0140753713433224e-05, "loss": 0.0061, "step": 160250 }, { "epoch": 1.73, "learning_rate": 4.012453784783032e-05, "loss": 0.0058, "step": 160260 }, { "epoch": 1.73, "learning_rate": 4.010832198222741e-05, "loss": 0.0076, "step": 160270 }, { "epoch": 1.73, "learning_rate": 4.00921061166245e-05, "loss": 0.0069, "step": 160280 }, { "epoch": 1.73, "learning_rate": 4.0075890251021595e-05, "loss": 0.0085, "step": 160290 }, { "epoch": 1.73, "learning_rate": 4.0059674385418694e-05, "loss": 0.0069, "step": 160300 }, { "epoch": 1.73, "learning_rate": 4.004345851981579e-05, "loss": 0.0102, "step": 160310 }, { "epoch": 1.73, "learning_rate": 4.002724265421288e-05, "loss": 0.0066, "step": 160320 }, { "epoch": 1.73, "learning_rate": 4.001102678860997e-05, "loss": 0.006, "step": 160330 }, { "epoch": 1.73, "learning_rate": 3.9994810923007065e-05, "loss": 0.0056, "step": 160340 }, { "epoch": 1.73, "learning_rate": 3.997859505740416e-05, "loss": 0.0083, "step": 160350 }, { "epoch": 1.73, "learning_rate": 3.996237919180126e-05, "loss": 0.0056, "step": 160360 }, { "epoch": 1.73, "learning_rate": 3.994616332619835e-05, "loss": 0.0057, "step": 160370 }, { "epoch": 1.73, "learning_rate": 3.992994746059544e-05, "loss": 0.0086, "step": 160380 }, { "epoch": 1.73, "learning_rate": 3.9913731594992536e-05, "loss": 0.0067, "step": 160390 }, { "epoch": 1.73, "learning_rate": 3.989751572938963e-05, "loss": 0.0066, "step": 160400 }, { "epoch": 1.73, "learning_rate": 3.988129986378673e-05, "loss": 0.0071, "step": 160410 }, { "epoch": 1.73, "learning_rate": 3.986508399818382e-05, "loss": 0.0061, "step": 160420 }, { "epoch": 1.73, "learning_rate": 3.9848868132580914e-05, "loss": 0.0084, "step": 160430 }, { "epoch": 1.73, "learning_rate": 3.9832652266978006e-05, "loss": 0.0106, "step": 160440 }, { "epoch": 1.73, "learning_rate": 3.98164364013751e-05, "loss": 0.0099, "step": 160450 }, { "epoch": 1.73, "learning_rate": 3.98002205357722e-05, "loss": 0.0051, "step": 160460 }, { "epoch": 1.73, "learning_rate": 3.978400467016929e-05, "loss": 0.0067, "step": 160470 }, { "epoch": 1.73, "learning_rate": 3.9767788804566384e-05, "loss": 0.0073, "step": 160480 }, { "epoch": 1.73, "learning_rate": 3.975157293896348e-05, "loss": 0.0066, "step": 160490 }, { "epoch": 1.74, "learning_rate": 3.973535707336057e-05, "loss": 0.0068, "step": 160500 }, { "epoch": 1.74, "learning_rate": 3.971914120775766e-05, "loss": 0.0058, "step": 160510 }, { "epoch": 1.74, "learning_rate": 3.970292534215476e-05, "loss": 0.0056, "step": 160520 }, { "epoch": 1.74, "learning_rate": 3.9686709476551855e-05, "loss": 0.0097, "step": 160530 }, { "epoch": 1.74, "learning_rate": 3.967049361094895e-05, "loss": 0.0054, "step": 160540 }, { "epoch": 1.74, "learning_rate": 3.965427774534604e-05, "loss": 0.0077, "step": 160550 }, { "epoch": 1.74, "learning_rate": 3.963806187974313e-05, "loss": 0.0057, "step": 160560 }, { "epoch": 1.74, "learning_rate": 3.962184601414023e-05, "loss": 0.0051, "step": 160570 }, { "epoch": 1.74, "learning_rate": 3.9605630148537325e-05, "loss": 0.0072, "step": 160580 }, { "epoch": 1.74, "learning_rate": 3.958941428293442e-05, "loss": 0.0072, "step": 160590 }, { "epoch": 1.74, "learning_rate": 3.957319841733151e-05, "loss": 0.0065, "step": 160600 }, { "epoch": 1.74, "learning_rate": 3.95569825517286e-05, "loss": 0.0072, "step": 160610 }, { "epoch": 1.74, "learning_rate": 3.9540766686125696e-05, "loss": 0.0084, "step": 160620 }, { "epoch": 1.74, "learning_rate": 3.9524550820522796e-05, "loss": 0.0067, "step": 160630 }, { "epoch": 1.74, "learning_rate": 3.950833495491989e-05, "loss": 0.0081, "step": 160640 }, { "epoch": 1.74, "learning_rate": 3.949211908931698e-05, "loss": 0.0072, "step": 160650 }, { "epoch": 1.74, "learning_rate": 3.9475903223714074e-05, "loss": 0.0086, "step": 160660 }, { "epoch": 1.74, "learning_rate": 3.9459687358111167e-05, "loss": 0.0085, "step": 160670 }, { "epoch": 1.74, "learning_rate": 3.9443471492508266e-05, "loss": 0.0054, "step": 160680 }, { "epoch": 1.74, "learning_rate": 3.942725562690536e-05, "loss": 0.0095, "step": 160690 }, { "epoch": 1.74, "learning_rate": 3.941103976130245e-05, "loss": 0.0081, "step": 160700 }, { "epoch": 1.74, "learning_rate": 3.9394823895699544e-05, "loss": 0.0069, "step": 160710 }, { "epoch": 1.74, "learning_rate": 3.937860803009664e-05, "loss": 0.008, "step": 160720 }, { "epoch": 1.74, "learning_rate": 3.9362392164493737e-05, "loss": 0.0078, "step": 160730 }, { "epoch": 1.74, "learning_rate": 3.934617629889083e-05, "loss": 0.0046, "step": 160740 }, { "epoch": 1.74, "learning_rate": 3.932996043328792e-05, "loss": 0.0046, "step": 160750 }, { "epoch": 1.74, "learning_rate": 3.9313744567685015e-05, "loss": 0.0062, "step": 160760 }, { "epoch": 1.74, "learning_rate": 3.929752870208212e-05, "loss": 0.0075, "step": 160770 }, { "epoch": 1.74, "learning_rate": 3.9281312836479214e-05, "loss": 0.0069, "step": 160780 }, { "epoch": 1.74, "learning_rate": 3.9265096970876307e-05, "loss": 0.0052, "step": 160790 }, { "epoch": 1.74, "learning_rate": 3.92488811052734e-05, "loss": 0.0087, "step": 160800 }, { "epoch": 1.74, "learning_rate": 3.923266523967049e-05, "loss": 0.0075, "step": 160810 }, { "epoch": 1.74, "learning_rate": 3.9216449374067585e-05, "loss": 0.0039, "step": 160820 }, { "epoch": 1.74, "learning_rate": 3.9200233508464684e-05, "loss": 0.0059, "step": 160830 }, { "epoch": 1.74, "learning_rate": 3.918401764286178e-05, "loss": 0.0086, "step": 160840 }, { "epoch": 1.74, "learning_rate": 3.916780177725887e-05, "loss": 0.0062, "step": 160850 }, { "epoch": 1.74, "learning_rate": 3.915158591165596e-05, "loss": 0.0077, "step": 160860 }, { "epoch": 1.74, "learning_rate": 3.9135370046053055e-05, "loss": 0.0061, "step": 160870 }, { "epoch": 1.74, "learning_rate": 3.9119154180450155e-05, "loss": 0.0061, "step": 160880 }, { "epoch": 1.74, "learning_rate": 3.910293831484725e-05, "loss": 0.0052, "step": 160890 }, { "epoch": 1.74, "learning_rate": 3.908672244924434e-05, "loss": 0.0074, "step": 160900 }, { "epoch": 1.74, "learning_rate": 3.907050658364143e-05, "loss": 0.0077, "step": 160910 }, { "epoch": 1.74, "learning_rate": 3.9054290718038526e-05, "loss": 0.0094, "step": 160920 }, { "epoch": 1.74, "learning_rate": 3.903807485243562e-05, "loss": 0.0057, "step": 160930 }, { "epoch": 1.74, "learning_rate": 3.902185898683272e-05, "loss": 0.006, "step": 160940 }, { "epoch": 1.74, "learning_rate": 3.900564312122981e-05, "loss": 0.0066, "step": 160950 }, { "epoch": 1.74, "learning_rate": 3.8989427255626904e-05, "loss": 0.0076, "step": 160960 }, { "epoch": 1.74, "learning_rate": 3.8973211390023996e-05, "loss": 0.0072, "step": 160970 }, { "epoch": 1.74, "learning_rate": 3.895699552442109e-05, "loss": 0.006, "step": 160980 }, { "epoch": 1.74, "learning_rate": 3.894077965881819e-05, "loss": 0.0077, "step": 160990 }, { "epoch": 1.74, "learning_rate": 3.892456379321528e-05, "loss": 0.0065, "step": 161000 }, { "epoch": 1.74, "eval_cer": 0.9215034822292522, "eval_loss": 0.0055848234333097935, "eval_runtime": 121.2713, "eval_samples_per_second": 16.492, "eval_steps_per_second": 4.123, "step": 161000 }, { "epoch": 1.74, "learning_rate": 3.8908347927612374e-05, "loss": 0.0072, "step": 161010 }, { "epoch": 1.74, "learning_rate": 3.889213206200947e-05, "loss": 0.0066, "step": 161020 }, { "epoch": 1.74, "learning_rate": 3.887591619640656e-05, "loss": 0.0064, "step": 161030 }, { "epoch": 1.74, "learning_rate": 3.885970033080366e-05, "loss": 0.0075, "step": 161040 }, { "epoch": 1.74, "learning_rate": 3.884348446520075e-05, "loss": 0.0064, "step": 161050 }, { "epoch": 1.74, "learning_rate": 3.8827268599597845e-05, "loss": 0.0071, "step": 161060 }, { "epoch": 1.74, "learning_rate": 3.881105273399494e-05, "loss": 0.0065, "step": 161070 }, { "epoch": 1.74, "learning_rate": 3.879483686839203e-05, "loss": 0.0063, "step": 161080 }, { "epoch": 1.74, "learning_rate": 3.877862100278912e-05, "loss": 0.0061, "step": 161090 }, { "epoch": 1.74, "learning_rate": 3.876240513718622e-05, "loss": 0.0068, "step": 161100 }, { "epoch": 1.74, "learning_rate": 3.8746189271583315e-05, "loss": 0.0102, "step": 161110 }, { "epoch": 1.74, "learning_rate": 3.872997340598041e-05, "loss": 0.0061, "step": 161120 }, { "epoch": 1.74, "learning_rate": 3.87137575403775e-05, "loss": 0.0063, "step": 161130 }, { "epoch": 1.74, "learning_rate": 3.869754167477459e-05, "loss": 0.0073, "step": 161140 }, { "epoch": 1.74, "learning_rate": 3.868132580917169e-05, "loss": 0.0067, "step": 161150 }, { "epoch": 1.74, "learning_rate": 3.8665109943568786e-05, "loss": 0.0061, "step": 161160 }, { "epoch": 1.74, "learning_rate": 3.864889407796588e-05, "loss": 0.0053, "step": 161170 }, { "epoch": 1.74, "learning_rate": 3.863267821236297e-05, "loss": 0.0071, "step": 161180 }, { "epoch": 1.74, "learning_rate": 3.8616462346760064e-05, "loss": 0.0062, "step": 161190 }, { "epoch": 1.74, "learning_rate": 3.860024648115716e-05, "loss": 0.0074, "step": 161200 }, { "epoch": 1.74, "learning_rate": 3.8584030615554256e-05, "loss": 0.0066, "step": 161210 }, { "epoch": 1.74, "learning_rate": 3.856781474995135e-05, "loss": 0.007, "step": 161220 }, { "epoch": 1.74, "learning_rate": 3.855159888434844e-05, "loss": 0.0078, "step": 161230 }, { "epoch": 1.74, "learning_rate": 3.8535383018745534e-05, "loss": 0.005, "step": 161240 }, { "epoch": 1.74, "learning_rate": 3.851916715314263e-05, "loss": 0.0076, "step": 161250 }, { "epoch": 1.74, "learning_rate": 3.8502951287539727e-05, "loss": 0.0065, "step": 161260 }, { "epoch": 1.74, "learning_rate": 3.848673542193682e-05, "loss": 0.0076, "step": 161270 }, { "epoch": 1.74, "learning_rate": 3.847051955633391e-05, "loss": 0.0086, "step": 161280 }, { "epoch": 1.74, "learning_rate": 3.8454303690731005e-05, "loss": 0.0066, "step": 161290 }, { "epoch": 1.74, "learning_rate": 3.84380878251281e-05, "loss": 0.0052, "step": 161300 }, { "epoch": 1.74, "learning_rate": 3.84218719595252e-05, "loss": 0.0063, "step": 161310 }, { "epoch": 1.74, "learning_rate": 3.840565609392229e-05, "loss": 0.005, "step": 161320 }, { "epoch": 1.74, "learning_rate": 3.838944022831938e-05, "loss": 0.0071, "step": 161330 }, { "epoch": 1.74, "learning_rate": 3.8373224362716475e-05, "loss": 0.0055, "step": 161340 }, { "epoch": 1.74, "learning_rate": 3.835700849711357e-05, "loss": 0.0052, "step": 161350 }, { "epoch": 1.74, "learning_rate": 3.834079263151066e-05, "loss": 0.0084, "step": 161360 }, { "epoch": 1.74, "learning_rate": 3.832457676590776e-05, "loss": 0.007, "step": 161370 }, { "epoch": 1.74, "learning_rate": 3.830836090030485e-05, "loss": 0.008, "step": 161380 }, { "epoch": 1.74, "learning_rate": 3.8292145034701946e-05, "loss": 0.0048, "step": 161390 }, { "epoch": 1.74, "learning_rate": 3.827592916909904e-05, "loss": 0.006, "step": 161400 }, { "epoch": 1.74, "learning_rate": 3.825971330349613e-05, "loss": 0.0049, "step": 161410 }, { "epoch": 1.75, "learning_rate": 3.824349743789323e-05, "loss": 0.0084, "step": 161420 }, { "epoch": 1.75, "learning_rate": 3.8227281572290323e-05, "loss": 0.0067, "step": 161430 }, { "epoch": 1.75, "learning_rate": 3.8211065706687416e-05, "loss": 0.0061, "step": 161440 }, { "epoch": 1.75, "learning_rate": 3.819484984108451e-05, "loss": 0.0071, "step": 161450 }, { "epoch": 1.75, "learning_rate": 3.81786339754816e-05, "loss": 0.0062, "step": 161460 }, { "epoch": 1.75, "learning_rate": 3.81624181098787e-05, "loss": 0.0053, "step": 161470 }, { "epoch": 1.75, "learning_rate": 3.8146202244275794e-05, "loss": 0.0071, "step": 161480 }, { "epoch": 1.75, "learning_rate": 3.8129986378672893e-05, "loss": 0.006, "step": 161490 }, { "epoch": 1.75, "learning_rate": 3.8113770513069986e-05, "loss": 0.0069, "step": 161500 }, { "epoch": 1.75, "learning_rate": 3.809755464746708e-05, "loss": 0.0064, "step": 161510 }, { "epoch": 1.75, "learning_rate": 3.808133878186418e-05, "loss": 0.0081, "step": 161520 }, { "epoch": 1.75, "learning_rate": 3.806512291626127e-05, "loss": 0.0054, "step": 161530 }, { "epoch": 1.75, "learning_rate": 3.8048907050658364e-05, "loss": 0.0062, "step": 161540 }, { "epoch": 1.75, "learning_rate": 3.803269118505546e-05, "loss": 0.0076, "step": 161550 }, { "epoch": 1.75, "learning_rate": 3.801647531945255e-05, "loss": 0.0064, "step": 161560 }, { "epoch": 1.75, "learning_rate": 3.800025945384965e-05, "loss": 0.0082, "step": 161570 }, { "epoch": 1.75, "learning_rate": 3.798404358824674e-05, "loss": 0.0061, "step": 161580 }, { "epoch": 1.75, "learning_rate": 3.7967827722643834e-05, "loss": 0.0057, "step": 161590 }, { "epoch": 1.75, "learning_rate": 3.795161185704093e-05, "loss": 0.0068, "step": 161600 }, { "epoch": 1.75, "learning_rate": 3.793539599143802e-05, "loss": 0.0075, "step": 161610 }, { "epoch": 1.75, "learning_rate": 3.791918012583512e-05, "loss": 0.0061, "step": 161620 }, { "epoch": 1.75, "learning_rate": 3.790296426023221e-05, "loss": 0.0062, "step": 161630 }, { "epoch": 1.75, "learning_rate": 3.7886748394629305e-05, "loss": 0.0065, "step": 161640 }, { "epoch": 1.75, "learning_rate": 3.78705325290264e-05, "loss": 0.008, "step": 161650 }, { "epoch": 1.75, "learning_rate": 3.785431666342349e-05, "loss": 0.0075, "step": 161660 }, { "epoch": 1.75, "learning_rate": 3.783810079782058e-05, "loss": 0.0077, "step": 161670 }, { "epoch": 1.75, "learning_rate": 3.782188493221768e-05, "loss": 0.0071, "step": 161680 }, { "epoch": 1.75, "learning_rate": 3.7805669066614775e-05, "loss": 0.006, "step": 161690 }, { "epoch": 1.75, "learning_rate": 3.778945320101187e-05, "loss": 0.0062, "step": 161700 }, { "epoch": 1.75, "learning_rate": 3.777323733540896e-05, "loss": 0.0119, "step": 161710 }, { "epoch": 1.75, "learning_rate": 3.7757021469806054e-05, "loss": 0.0074, "step": 161720 }, { "epoch": 1.75, "learning_rate": 3.774080560420315e-05, "loss": 0.0055, "step": 161730 }, { "epoch": 1.75, "learning_rate": 3.7724589738600246e-05, "loss": 0.0059, "step": 161740 }, { "epoch": 1.75, "learning_rate": 3.770837387299734e-05, "loss": 0.0064, "step": 161750 }, { "epoch": 1.75, "learning_rate": 3.769215800739443e-05, "loss": 0.0056, "step": 161760 }, { "epoch": 1.75, "learning_rate": 3.7675942141791524e-05, "loss": 0.0076, "step": 161770 }, { "epoch": 1.75, "learning_rate": 3.7659726276188624e-05, "loss": 0.0053, "step": 161780 }, { "epoch": 1.75, "learning_rate": 3.7643510410585716e-05, "loss": 0.0048, "step": 161790 }, { "epoch": 1.75, "learning_rate": 3.762729454498281e-05, "loss": 0.0068, "step": 161800 }, { "epoch": 1.75, "learning_rate": 3.76110786793799e-05, "loss": 0.0059, "step": 161810 }, { "epoch": 1.75, "learning_rate": 3.7594862813776995e-05, "loss": 0.0063, "step": 161820 }, { "epoch": 1.75, "learning_rate": 3.757864694817409e-05, "loss": 0.0084, "step": 161830 }, { "epoch": 1.75, "learning_rate": 3.756243108257119e-05, "loss": 0.0073, "step": 161840 }, { "epoch": 1.75, "learning_rate": 3.754621521696828e-05, "loss": 0.0068, "step": 161850 }, { "epoch": 1.75, "learning_rate": 3.752999935136537e-05, "loss": 0.008, "step": 161860 }, { "epoch": 1.75, "learning_rate": 3.7513783485762465e-05, "loss": 0.0066, "step": 161870 }, { "epoch": 1.75, "learning_rate": 3.749756762015956e-05, "loss": 0.0089, "step": 161880 }, { "epoch": 1.75, "learning_rate": 3.748135175455666e-05, "loss": 0.0073, "step": 161890 }, { "epoch": 1.75, "learning_rate": 3.746513588895375e-05, "loss": 0.0062, "step": 161900 }, { "epoch": 1.75, "learning_rate": 3.744892002335084e-05, "loss": 0.0061, "step": 161910 }, { "epoch": 1.75, "learning_rate": 3.7432704157747936e-05, "loss": 0.0055, "step": 161920 }, { "epoch": 1.75, "learning_rate": 3.741648829214503e-05, "loss": 0.0054, "step": 161930 }, { "epoch": 1.75, "learning_rate": 3.740027242654212e-05, "loss": 0.0076, "step": 161940 }, { "epoch": 1.75, "learning_rate": 3.738405656093922e-05, "loss": 0.0062, "step": 161950 }, { "epoch": 1.75, "learning_rate": 3.7367840695336313e-05, "loss": 0.0067, "step": 161960 }, { "epoch": 1.75, "learning_rate": 3.7351624829733406e-05, "loss": 0.0102, "step": 161970 }, { "epoch": 1.75, "learning_rate": 3.73354089641305e-05, "loss": 0.0063, "step": 161980 }, { "epoch": 1.75, "learning_rate": 3.731919309852759e-05, "loss": 0.0078, "step": 161990 }, { "epoch": 1.75, "learning_rate": 3.730297723292469e-05, "loss": 0.0105, "step": 162000 }, { "epoch": 1.75, "eval_cer": 0.9215130368617722, "eval_loss": 0.005664716940373182, "eval_runtime": 121.2783, "eval_samples_per_second": 16.491, "eval_steps_per_second": 4.123, "step": 162000 }, { "epoch": 1.75, "learning_rate": 3.7286761367321784e-05, "loss": 0.0052, "step": 162010 }, { "epoch": 1.75, "learning_rate": 3.727054550171888e-05, "loss": 0.0084, "step": 162020 }, { "epoch": 1.75, "learning_rate": 3.7254329636115976e-05, "loss": 0.0055, "step": 162030 }, { "epoch": 1.75, "learning_rate": 3.723811377051307e-05, "loss": 0.0059, "step": 162040 }, { "epoch": 1.75, "learning_rate": 3.722189790491016e-05, "loss": 0.0044, "step": 162050 }, { "epoch": 1.75, "learning_rate": 3.7205682039307254e-05, "loss": 0.0063, "step": 162060 }, { "epoch": 1.75, "learning_rate": 3.7189466173704354e-05, "loss": 0.0067, "step": 162070 }, { "epoch": 1.75, "learning_rate": 3.717325030810145e-05, "loss": 0.0112, "step": 162080 }, { "epoch": 1.75, "learning_rate": 3.715703444249854e-05, "loss": 0.0063, "step": 162090 }, { "epoch": 1.75, "learning_rate": 3.714081857689563e-05, "loss": 0.0088, "step": 162100 }, { "epoch": 1.75, "learning_rate": 3.7124602711292725e-05, "loss": 0.0062, "step": 162110 }, { "epoch": 1.75, "learning_rate": 3.710838684568982e-05, "loss": 0.0074, "step": 162120 }, { "epoch": 1.75, "learning_rate": 3.709217098008692e-05, "loss": 0.0079, "step": 162130 }, { "epoch": 1.75, "learning_rate": 3.707595511448401e-05, "loss": 0.0078, "step": 162140 }, { "epoch": 1.75, "learning_rate": 3.70597392488811e-05, "loss": 0.0077, "step": 162150 }, { "epoch": 1.75, "learning_rate": 3.7043523383278195e-05, "loss": 0.0048, "step": 162160 }, { "epoch": 1.75, "learning_rate": 3.702730751767529e-05, "loss": 0.0054, "step": 162170 }, { "epoch": 1.75, "learning_rate": 3.701109165207239e-05, "loss": 0.0072, "step": 162180 }, { "epoch": 1.75, "learning_rate": 3.699487578646948e-05, "loss": 0.0066, "step": 162190 }, { "epoch": 1.75, "learning_rate": 3.697865992086657e-05, "loss": 0.0058, "step": 162200 }, { "epoch": 1.75, "learning_rate": 3.6962444055263666e-05, "loss": 0.0089, "step": 162210 }, { "epoch": 1.75, "learning_rate": 3.694622818966076e-05, "loss": 0.007, "step": 162220 }, { "epoch": 1.75, "learning_rate": 3.693001232405785e-05, "loss": 0.0063, "step": 162230 }, { "epoch": 1.75, "learning_rate": 3.691379645845495e-05, "loss": 0.0073, "step": 162240 }, { "epoch": 1.75, "learning_rate": 3.6897580592852044e-05, "loss": 0.0066, "step": 162250 }, { "epoch": 1.75, "learning_rate": 3.6881364727249136e-05, "loss": 0.0053, "step": 162260 }, { "epoch": 1.75, "learning_rate": 3.686514886164623e-05, "loss": 0.0081, "step": 162270 }, { "epoch": 1.75, "learning_rate": 3.684893299604332e-05, "loss": 0.0075, "step": 162280 }, { "epoch": 1.75, "learning_rate": 3.683271713044042e-05, "loss": 0.0049, "step": 162290 }, { "epoch": 1.75, "learning_rate": 3.6816501264837514e-05, "loss": 0.0072, "step": 162300 }, { "epoch": 1.75, "learning_rate": 3.680028539923461e-05, "loss": 0.007, "step": 162310 }, { "epoch": 1.75, "learning_rate": 3.67840695336317e-05, "loss": 0.0092, "step": 162320 }, { "epoch": 1.75, "learning_rate": 3.676785366802879e-05, "loss": 0.0072, "step": 162330 }, { "epoch": 1.75, "learning_rate": 3.675163780242589e-05, "loss": 0.0078, "step": 162340 }, { "epoch": 1.76, "learning_rate": 3.6735421936822985e-05, "loss": 0.008, "step": 162350 }, { "epoch": 1.76, "learning_rate": 3.671920607122008e-05, "loss": 0.0068, "step": 162360 }, { "epoch": 1.76, "learning_rate": 3.670299020561717e-05, "loss": 0.0055, "step": 162370 }, { "epoch": 1.76, "learning_rate": 3.668677434001426e-05, "loss": 0.0074, "step": 162380 }, { "epoch": 1.76, "learning_rate": 3.667055847441136e-05, "loss": 0.0069, "step": 162390 }, { "epoch": 1.76, "learning_rate": 3.6654342608808455e-05, "loss": 0.0058, "step": 162400 }, { "epoch": 1.76, "learning_rate": 3.663812674320555e-05, "loss": 0.0069, "step": 162410 }, { "epoch": 1.76, "learning_rate": 3.662191087760265e-05, "loss": 0.0066, "step": 162420 }, { "epoch": 1.76, "learning_rate": 3.660569501199974e-05, "loss": 0.0075, "step": 162430 }, { "epoch": 1.76, "learning_rate": 3.658947914639683e-05, "loss": 0.0084, "step": 162440 }, { "epoch": 1.76, "learning_rate": 3.6573263280793926e-05, "loss": 0.0076, "step": 162450 }, { "epoch": 1.76, "learning_rate": 3.655704741519102e-05, "loss": 0.005, "step": 162460 }, { "epoch": 1.76, "learning_rate": 3.654083154958812e-05, "loss": 0.0092, "step": 162470 }, { "epoch": 1.76, "learning_rate": 3.652461568398521e-05, "loss": 0.006, "step": 162480 }, { "epoch": 1.76, "learning_rate": 3.65083998183823e-05, "loss": 0.0047, "step": 162490 }, { "epoch": 1.76, "learning_rate": 3.6492183952779396e-05, "loss": 0.0073, "step": 162500 }, { "epoch": 1.76, "learning_rate": 3.647596808717649e-05, "loss": 0.0115, "step": 162510 }, { "epoch": 1.76, "learning_rate": 3.645975222157358e-05, "loss": 0.0083, "step": 162520 }, { "epoch": 1.76, "learning_rate": 3.644353635597068e-05, "loss": 0.0053, "step": 162530 }, { "epoch": 1.76, "learning_rate": 3.6427320490367774e-05, "loss": 0.0066, "step": 162540 }, { "epoch": 1.76, "learning_rate": 3.6411104624764867e-05, "loss": 0.0058, "step": 162550 }, { "epoch": 1.76, "learning_rate": 3.639488875916196e-05, "loss": 0.0067, "step": 162560 }, { "epoch": 1.76, "learning_rate": 3.637867289355905e-05, "loss": 0.0064, "step": 162570 }, { "epoch": 1.76, "learning_rate": 3.636245702795615e-05, "loss": 0.0067, "step": 162580 }, { "epoch": 1.76, "learning_rate": 3.6346241162353244e-05, "loss": 0.0061, "step": 162590 }, { "epoch": 1.76, "learning_rate": 3.633002529675034e-05, "loss": 0.006, "step": 162600 }, { "epoch": 1.76, "learning_rate": 3.631380943114743e-05, "loss": 0.0077, "step": 162610 }, { "epoch": 1.76, "learning_rate": 3.629759356554452e-05, "loss": 0.0077, "step": 162620 }, { "epoch": 1.76, "learning_rate": 3.628137769994162e-05, "loss": 0.0061, "step": 162630 }, { "epoch": 1.76, "learning_rate": 3.6265161834338715e-05, "loss": 0.0089, "step": 162640 }, { "epoch": 1.76, "learning_rate": 3.624894596873581e-05, "loss": 0.008, "step": 162650 }, { "epoch": 1.76, "learning_rate": 3.62327301031329e-05, "loss": 0.0078, "step": 162660 }, { "epoch": 1.76, "learning_rate": 3.621651423752999e-05, "loss": 0.0072, "step": 162670 }, { "epoch": 1.76, "learning_rate": 3.6200298371927086e-05, "loss": 0.0051, "step": 162680 }, { "epoch": 1.76, "learning_rate": 3.6184082506324185e-05, "loss": 0.0081, "step": 162690 }, { "epoch": 1.76, "learning_rate": 3.616786664072128e-05, "loss": 0.0064, "step": 162700 }, { "epoch": 1.76, "learning_rate": 3.615165077511837e-05, "loss": 0.0082, "step": 162710 }, { "epoch": 1.76, "learning_rate": 3.6135434909515464e-05, "loss": 0.0059, "step": 162720 }, { "epoch": 1.76, "learning_rate": 3.6119219043912556e-05, "loss": 0.0092, "step": 162730 }, { "epoch": 1.76, "learning_rate": 3.6103003178309656e-05, "loss": 0.008, "step": 162740 }, { "epoch": 1.76, "learning_rate": 3.608678731270675e-05, "loss": 0.0084, "step": 162750 }, { "epoch": 1.76, "learning_rate": 3.607057144710385e-05, "loss": 0.0088, "step": 162760 }, { "epoch": 1.76, "learning_rate": 3.605435558150094e-05, "loss": 0.0074, "step": 162770 }, { "epoch": 1.76, "learning_rate": 3.6038139715898034e-05, "loss": 0.0097, "step": 162780 }, { "epoch": 1.76, "learning_rate": 3.6021923850295126e-05, "loss": 0.0073, "step": 162790 }, { "epoch": 1.76, "learning_rate": 3.600570798469222e-05, "loss": 0.0083, "step": 162800 }, { "epoch": 1.76, "learning_rate": 3.598949211908931e-05, "loss": 0.0063, "step": 162810 }, { "epoch": 1.76, "learning_rate": 3.597327625348641e-05, "loss": 0.0082, "step": 162820 }, { "epoch": 1.76, "learning_rate": 3.5957060387883504e-05, "loss": 0.0059, "step": 162830 }, { "epoch": 1.76, "learning_rate": 3.59408445222806e-05, "loss": 0.0073, "step": 162840 }, { "epoch": 1.76, "learning_rate": 3.592462865667769e-05, "loss": 0.0061, "step": 162850 }, { "epoch": 1.76, "learning_rate": 3.590841279107478e-05, "loss": 0.0084, "step": 162860 }, { "epoch": 1.76, "learning_rate": 3.589219692547188e-05, "loss": 0.0067, "step": 162870 }, { "epoch": 1.76, "learning_rate": 3.5875981059868975e-05, "loss": 0.0064, "step": 162880 }, { "epoch": 1.76, "learning_rate": 3.585976519426607e-05, "loss": 0.0071, "step": 162890 }, { "epoch": 1.76, "learning_rate": 3.584354932866316e-05, "loss": 0.0073, "step": 162900 }, { "epoch": 1.76, "learning_rate": 3.582733346306025e-05, "loss": 0.0064, "step": 162910 }, { "epoch": 1.76, "learning_rate": 3.581111759745735e-05, "loss": 0.0066, "step": 162920 }, { "epoch": 1.76, "learning_rate": 3.5794901731854445e-05, "loss": 0.0066, "step": 162930 }, { "epoch": 1.76, "learning_rate": 3.577868586625154e-05, "loss": 0.0065, "step": 162940 }, { "epoch": 1.76, "learning_rate": 3.576247000064863e-05, "loss": 0.0063, "step": 162950 }, { "epoch": 1.76, "learning_rate": 3.574625413504572e-05, "loss": 0.0044, "step": 162960 }, { "epoch": 1.76, "learning_rate": 3.5730038269442816e-05, "loss": 0.0057, "step": 162970 }, { "epoch": 1.76, "learning_rate": 3.5713822403839916e-05, "loss": 0.0064, "step": 162980 }, { "epoch": 1.76, "learning_rate": 3.569760653823701e-05, "loss": 0.007, "step": 162990 }, { "epoch": 1.76, "learning_rate": 3.56813906726341e-05, "loss": 0.0075, "step": 163000 }, { "epoch": 1.76, "eval_cer": 0.921507825244034, "eval_loss": 0.005535805597901344, "eval_runtime": 121.0817, "eval_samples_per_second": 16.518, "eval_steps_per_second": 4.129, "step": 163000 }, { "epoch": 1.76, "learning_rate": 3.5665174807031194e-05, "loss": 0.0066, "step": 163010 }, { "epoch": 1.76, "learning_rate": 3.5648958941428287e-05, "loss": 0.0079, "step": 163020 }, { "epoch": 1.76, "learning_rate": 3.5632743075825386e-05, "loss": 0.0076, "step": 163030 }, { "epoch": 1.76, "learning_rate": 3.561652721022248e-05, "loss": 0.0053, "step": 163040 }, { "epoch": 1.76, "learning_rate": 3.560031134461957e-05, "loss": 0.0076, "step": 163050 }, { "epoch": 1.76, "learning_rate": 3.5584095479016664e-05, "loss": 0.0066, "step": 163060 }, { "epoch": 1.76, "learning_rate": 3.556787961341376e-05, "loss": 0.0053, "step": 163070 }, { "epoch": 1.76, "learning_rate": 3.5551663747810857e-05, "loss": 0.0065, "step": 163080 }, { "epoch": 1.76, "learning_rate": 3.553544788220795e-05, "loss": 0.0058, "step": 163090 }, { "epoch": 1.76, "learning_rate": 3.551923201660504e-05, "loss": 0.0076, "step": 163100 }, { "epoch": 1.76, "learning_rate": 3.550301615100214e-05, "loss": 0.0049, "step": 163110 }, { "epoch": 1.76, "learning_rate": 3.5486800285399234e-05, "loss": 0.008, "step": 163120 }, { "epoch": 1.76, "learning_rate": 3.547058441979633e-05, "loss": 0.0091, "step": 163130 }, { "epoch": 1.76, "learning_rate": 3.545436855419342e-05, "loss": 0.0063, "step": 163140 }, { "epoch": 1.76, "learning_rate": 3.543815268859051e-05, "loss": 0.0049, "step": 163150 }, { "epoch": 1.76, "learning_rate": 3.542193682298761e-05, "loss": 0.0052, "step": 163160 }, { "epoch": 1.76, "learning_rate": 3.5405720957384705e-05, "loss": 0.0064, "step": 163170 }, { "epoch": 1.76, "learning_rate": 3.53895050917818e-05, "loss": 0.0053, "step": 163180 }, { "epoch": 1.76, "learning_rate": 3.537328922617889e-05, "loss": 0.0065, "step": 163190 }, { "epoch": 1.76, "learning_rate": 3.535707336057598e-05, "loss": 0.0061, "step": 163200 }, { "epoch": 1.76, "learning_rate": 3.534085749497308e-05, "loss": 0.0055, "step": 163210 }, { "epoch": 1.76, "learning_rate": 3.5324641629370175e-05, "loss": 0.0064, "step": 163220 }, { "epoch": 1.76, "learning_rate": 3.530842576376727e-05, "loss": 0.0075, "step": 163230 }, { "epoch": 1.76, "learning_rate": 3.529220989816436e-05, "loss": 0.0064, "step": 163240 }, { "epoch": 1.76, "learning_rate": 3.5275994032561454e-05, "loss": 0.0073, "step": 163250 }, { "epoch": 1.76, "learning_rate": 3.5259778166958546e-05, "loss": 0.0079, "step": 163260 }, { "epoch": 1.77, "learning_rate": 3.5243562301355646e-05, "loss": 0.0069, "step": 163270 }, { "epoch": 1.77, "learning_rate": 3.522734643575274e-05, "loss": 0.0068, "step": 163280 }, { "epoch": 1.77, "learning_rate": 3.521113057014983e-05, "loss": 0.0054, "step": 163290 }, { "epoch": 1.77, "learning_rate": 3.5194914704546924e-05, "loss": 0.0075, "step": 163300 }, { "epoch": 1.77, "learning_rate": 3.517869883894402e-05, "loss": 0.0084, "step": 163310 }, { "epoch": 1.77, "learning_rate": 3.5162482973341116e-05, "loss": 0.0064, "step": 163320 }, { "epoch": 1.77, "learning_rate": 3.514626710773821e-05, "loss": 0.0061, "step": 163330 }, { "epoch": 1.77, "learning_rate": 3.51300512421353e-05, "loss": 0.0064, "step": 163340 }, { "epoch": 1.77, "learning_rate": 3.5113835376532394e-05, "loss": 0.0087, "step": 163350 }, { "epoch": 1.77, "learning_rate": 3.509761951092949e-05, "loss": 0.0048, "step": 163360 }, { "epoch": 1.77, "learning_rate": 3.508140364532659e-05, "loss": 0.0075, "step": 163370 }, { "epoch": 1.77, "learning_rate": 3.506518777972368e-05, "loss": 0.0059, "step": 163380 }, { "epoch": 1.77, "learning_rate": 3.504897191412077e-05, "loss": 0.0057, "step": 163390 }, { "epoch": 1.77, "learning_rate": 3.5032756048517865e-05, "loss": 0.0071, "step": 163400 }, { "epoch": 1.77, "learning_rate": 3.501654018291496e-05, "loss": 0.006, "step": 163410 }, { "epoch": 1.77, "learning_rate": 3.500032431731205e-05, "loss": 0.0081, "step": 163420 }, { "epoch": 1.77, "learning_rate": 3.498410845170915e-05, "loss": 0.0072, "step": 163430 }, { "epoch": 1.77, "learning_rate": 3.496789258610624e-05, "loss": 0.006, "step": 163440 }, { "epoch": 1.77, "learning_rate": 3.4951676720503335e-05, "loss": 0.0063, "step": 163450 }, { "epoch": 1.77, "learning_rate": 3.493546085490043e-05, "loss": 0.0064, "step": 163460 }, { "epoch": 1.77, "learning_rate": 3.491924498929753e-05, "loss": 0.0063, "step": 163470 }, { "epoch": 1.77, "learning_rate": 3.490302912369462e-05, "loss": 0.0052, "step": 163480 }, { "epoch": 1.77, "learning_rate": 3.488681325809171e-05, "loss": 0.0052, "step": 163490 }, { "epoch": 1.77, "learning_rate": 3.487059739248881e-05, "loss": 0.007, "step": 163500 }, { "epoch": 1.77, "learning_rate": 3.4854381526885905e-05, "loss": 0.0059, "step": 163510 }, { "epoch": 1.77, "learning_rate": 3.4838165661283e-05, "loss": 0.0075, "step": 163520 }, { "epoch": 1.77, "learning_rate": 3.482194979568009e-05, "loss": 0.0089, "step": 163530 }, { "epoch": 1.77, "learning_rate": 3.4805733930077184e-05, "loss": 0.0051, "step": 163540 }, { "epoch": 1.77, "learning_rate": 3.4789518064474276e-05, "loss": 0.0055, "step": 163550 }, { "epoch": 1.77, "learning_rate": 3.4773302198871376e-05, "loss": 0.0045, "step": 163560 }, { "epoch": 1.77, "learning_rate": 3.475708633326847e-05, "loss": 0.0063, "step": 163570 }, { "epoch": 1.77, "learning_rate": 3.474087046766556e-05, "loss": 0.0075, "step": 163580 }, { "epoch": 1.77, "learning_rate": 3.4724654602062654e-05, "loss": 0.0069, "step": 163590 }, { "epoch": 1.77, "learning_rate": 3.470843873645975e-05, "loss": 0.0076, "step": 163600 }, { "epoch": 1.77, "learning_rate": 3.4692222870856846e-05, "loss": 0.0078, "step": 163610 }, { "epoch": 1.77, "learning_rate": 3.467600700525394e-05, "loss": 0.0063, "step": 163620 }, { "epoch": 1.77, "learning_rate": 3.465979113965103e-05, "loss": 0.0059, "step": 163630 }, { "epoch": 1.77, "learning_rate": 3.4643575274048125e-05, "loss": 0.0079, "step": 163640 }, { "epoch": 1.77, "learning_rate": 3.462735940844522e-05, "loss": 0.0071, "step": 163650 }, { "epoch": 1.77, "learning_rate": 3.461114354284232e-05, "loss": 0.0064, "step": 163660 }, { "epoch": 1.77, "learning_rate": 3.459492767723941e-05, "loss": 0.0074, "step": 163670 }, { "epoch": 1.77, "learning_rate": 3.45787118116365e-05, "loss": 0.0087, "step": 163680 }, { "epoch": 1.77, "learning_rate": 3.4562495946033595e-05, "loss": 0.0077, "step": 163690 }, { "epoch": 1.77, "learning_rate": 3.454628008043069e-05, "loss": 0.0084, "step": 163700 }, { "epoch": 1.77, "learning_rate": 3.453006421482778e-05, "loss": 0.0058, "step": 163710 }, { "epoch": 1.77, "learning_rate": 3.451384834922488e-05, "loss": 0.0062, "step": 163720 }, { "epoch": 1.77, "learning_rate": 3.449763248362197e-05, "loss": 0.0061, "step": 163730 }, { "epoch": 1.77, "learning_rate": 3.4481416618019066e-05, "loss": 0.0071, "step": 163740 }, { "epoch": 1.77, "learning_rate": 3.446520075241616e-05, "loss": 0.0072, "step": 163750 }, { "epoch": 1.77, "learning_rate": 3.444898488681325e-05, "loss": 0.0051, "step": 163760 }, { "epoch": 1.77, "learning_rate": 3.443276902121035e-05, "loss": 0.006, "step": 163770 }, { "epoch": 1.77, "learning_rate": 3.4416553155607443e-05, "loss": 0.0066, "step": 163780 }, { "epoch": 1.77, "learning_rate": 3.4400337290004536e-05, "loss": 0.0067, "step": 163790 }, { "epoch": 1.77, "learning_rate": 3.438412142440163e-05, "loss": 0.0078, "step": 163800 }, { "epoch": 1.77, "learning_rate": 3.436790555879872e-05, "loss": 0.0061, "step": 163810 }, { "epoch": 1.77, "learning_rate": 3.4351689693195814e-05, "loss": 0.0057, "step": 163820 }, { "epoch": 1.77, "learning_rate": 3.4335473827592914e-05, "loss": 0.006, "step": 163830 }, { "epoch": 1.77, "learning_rate": 3.431925796199001e-05, "loss": 0.0068, "step": 163840 }, { "epoch": 1.77, "learning_rate": 3.4303042096387106e-05, "loss": 0.0068, "step": 163850 }, { "epoch": 1.77, "learning_rate": 3.42868262307842e-05, "loss": 0.0072, "step": 163860 }, { "epoch": 1.77, "learning_rate": 3.427061036518129e-05, "loss": 0.0074, "step": 163870 }, { "epoch": 1.77, "learning_rate": 3.4254394499578384e-05, "loss": 0.0071, "step": 163880 }, { "epoch": 1.77, "learning_rate": 3.423817863397548e-05, "loss": 0.0065, "step": 163890 }, { "epoch": 1.77, "learning_rate": 3.422196276837258e-05, "loss": 0.0061, "step": 163900 }, { "epoch": 1.77, "learning_rate": 3.420574690276967e-05, "loss": 0.0057, "step": 163910 }, { "epoch": 1.77, "learning_rate": 3.418953103716676e-05, "loss": 0.0085, "step": 163920 }, { "epoch": 1.77, "learning_rate": 3.4173315171563855e-05, "loss": 0.0069, "step": 163930 }, { "epoch": 1.77, "learning_rate": 3.415709930596095e-05, "loss": 0.0062, "step": 163940 }, { "epoch": 1.77, "learning_rate": 3.414088344035805e-05, "loss": 0.0074, "step": 163950 }, { "epoch": 1.77, "learning_rate": 3.412466757475514e-05, "loss": 0.0074, "step": 163960 }, { "epoch": 1.77, "learning_rate": 3.410845170915223e-05, "loss": 0.0057, "step": 163970 }, { "epoch": 1.77, "learning_rate": 3.4092235843549325e-05, "loss": 0.0056, "step": 163980 }, { "epoch": 1.77, "learning_rate": 3.407601997794642e-05, "loss": 0.005, "step": 163990 }, { "epoch": 1.77, "learning_rate": 3.405980411234351e-05, "loss": 0.0069, "step": 164000 }, { "epoch": 1.77, "eval_cer": 0.9215086938469904, "eval_loss": 0.005612937733530998, "eval_runtime": 121.4334, "eval_samples_per_second": 16.47, "eval_steps_per_second": 4.117, "step": 164000 }, { "epoch": 1.77, "learning_rate": 3.404358824674061e-05, "loss": 0.0063, "step": 164010 }, { "epoch": 1.77, "learning_rate": 3.40273723811377e-05, "loss": 0.0055, "step": 164020 }, { "epoch": 1.77, "learning_rate": 3.4011156515534796e-05, "loss": 0.0069, "step": 164030 }, { "epoch": 1.77, "learning_rate": 3.399494064993189e-05, "loss": 0.0059, "step": 164040 }, { "epoch": 1.77, "learning_rate": 3.397872478432898e-05, "loss": 0.0072, "step": 164050 }, { "epoch": 1.77, "learning_rate": 3.396250891872608e-05, "loss": 0.007, "step": 164060 }, { "epoch": 1.77, "learning_rate": 3.3946293053123174e-05, "loss": 0.0089, "step": 164070 }, { "epoch": 1.77, "learning_rate": 3.3930077187520266e-05, "loss": 0.0084, "step": 164080 }, { "epoch": 1.77, "learning_rate": 3.391386132191736e-05, "loss": 0.0083, "step": 164090 }, { "epoch": 1.77, "learning_rate": 3.389764545631445e-05, "loss": 0.0085, "step": 164100 }, { "epoch": 1.77, "learning_rate": 3.3881429590711545e-05, "loss": 0.0059, "step": 164110 }, { "epoch": 1.77, "learning_rate": 3.3865213725108644e-05, "loss": 0.0088, "step": 164120 }, { "epoch": 1.77, "learning_rate": 3.384899785950574e-05, "loss": 0.0075, "step": 164130 }, { "epoch": 1.77, "learning_rate": 3.383278199390283e-05, "loss": 0.0071, "step": 164140 }, { "epoch": 1.77, "learning_rate": 3.381656612829992e-05, "loss": 0.0059, "step": 164150 }, { "epoch": 1.77, "learning_rate": 3.3800350262697015e-05, "loss": 0.0052, "step": 164160 }, { "epoch": 1.77, "learning_rate": 3.3784134397094115e-05, "loss": 0.008, "step": 164170 }, { "epoch": 1.77, "learning_rate": 3.376791853149121e-05, "loss": 0.0059, "step": 164180 }, { "epoch": 1.77, "learning_rate": 3.375170266588831e-05, "loss": 0.0061, "step": 164190 }, { "epoch": 1.78, "learning_rate": 3.37354868002854e-05, "loss": 0.0055, "step": 164200 }, { "epoch": 1.78, "learning_rate": 3.371927093468249e-05, "loss": 0.0066, "step": 164210 }, { "epoch": 1.78, "learning_rate": 3.3703055069079585e-05, "loss": 0.0085, "step": 164220 }, { "epoch": 1.78, "learning_rate": 3.368683920347668e-05, "loss": 0.0059, "step": 164230 }, { "epoch": 1.78, "learning_rate": 3.367062333787378e-05, "loss": 0.0058, "step": 164240 }, { "epoch": 1.78, "learning_rate": 3.365440747227087e-05, "loss": 0.0073, "step": 164250 }, { "epoch": 1.78, "learning_rate": 3.363819160666796e-05, "loss": 0.0075, "step": 164260 }, { "epoch": 1.78, "learning_rate": 3.3621975741065056e-05, "loss": 0.0068, "step": 164270 }, { "epoch": 1.78, "learning_rate": 3.360575987546215e-05, "loss": 0.0068, "step": 164280 }, { "epoch": 1.78, "learning_rate": 3.358954400985924e-05, "loss": 0.0053, "step": 164290 }, { "epoch": 1.78, "learning_rate": 3.357332814425634e-05, "loss": 0.0072, "step": 164300 }, { "epoch": 1.78, "learning_rate": 3.355711227865343e-05, "loss": 0.0064, "step": 164310 }, { "epoch": 1.78, "learning_rate": 3.3540896413050526e-05, "loss": 0.0067, "step": 164320 }, { "epoch": 1.78, "learning_rate": 3.352468054744762e-05, "loss": 0.0058, "step": 164330 }, { "epoch": 1.78, "learning_rate": 3.350846468184471e-05, "loss": 0.0077, "step": 164340 }, { "epoch": 1.78, "learning_rate": 3.349224881624181e-05, "loss": 0.0068, "step": 164350 }, { "epoch": 1.78, "learning_rate": 3.3476032950638904e-05, "loss": 0.0074, "step": 164360 }, { "epoch": 1.78, "learning_rate": 3.3459817085036e-05, "loss": 0.0043, "step": 164370 }, { "epoch": 1.78, "learning_rate": 3.344360121943309e-05, "loss": 0.0058, "step": 164380 }, { "epoch": 1.78, "learning_rate": 3.342738535383018e-05, "loss": 0.006, "step": 164390 }, { "epoch": 1.78, "learning_rate": 3.3411169488227275e-05, "loss": 0.0072, "step": 164400 }, { "epoch": 1.78, "learning_rate": 3.3394953622624374e-05, "loss": 0.0058, "step": 164410 }, { "epoch": 1.78, "learning_rate": 3.337873775702147e-05, "loss": 0.0082, "step": 164420 }, { "epoch": 1.78, "learning_rate": 3.336252189141856e-05, "loss": 0.0085, "step": 164430 }, { "epoch": 1.78, "learning_rate": 3.334630602581565e-05, "loss": 0.0066, "step": 164440 }, { "epoch": 1.78, "learning_rate": 3.3330090160212745e-05, "loss": 0.0086, "step": 164450 }, { "epoch": 1.78, "learning_rate": 3.3313874294609845e-05, "loss": 0.0085, "step": 164460 }, { "epoch": 1.78, "learning_rate": 3.329765842900694e-05, "loss": 0.007, "step": 164470 }, { "epoch": 1.78, "learning_rate": 3.328144256340403e-05, "loss": 0.0065, "step": 164480 }, { "epoch": 1.78, "learning_rate": 3.326522669780112e-05, "loss": 0.0071, "step": 164490 }, { "epoch": 1.78, "learning_rate": 3.3249010832198216e-05, "loss": 0.0073, "step": 164500 }, { "epoch": 1.78, "learning_rate": 3.3232794966595315e-05, "loss": 0.0062, "step": 164510 }, { "epoch": 1.78, "learning_rate": 3.321657910099241e-05, "loss": 0.0132, "step": 164520 }, { "epoch": 1.78, "learning_rate": 3.32003632353895e-05, "loss": 0.0067, "step": 164530 }, { "epoch": 1.78, "learning_rate": 3.31841473697866e-05, "loss": 0.0051, "step": 164540 }, { "epoch": 1.78, "learning_rate": 3.316793150418369e-05, "loss": 0.0062, "step": 164550 }, { "epoch": 1.78, "learning_rate": 3.3151715638580786e-05, "loss": 0.0051, "step": 164560 }, { "epoch": 1.78, "learning_rate": 3.313549977297788e-05, "loss": 0.006, "step": 164570 }, { "epoch": 1.78, "learning_rate": 3.311928390737497e-05, "loss": 0.0069, "step": 164580 }, { "epoch": 1.78, "learning_rate": 3.310306804177207e-05, "loss": 0.0075, "step": 164590 }, { "epoch": 1.78, "learning_rate": 3.3086852176169164e-05, "loss": 0.0069, "step": 164600 }, { "epoch": 1.78, "learning_rate": 3.3070636310566256e-05, "loss": 0.0075, "step": 164610 }, { "epoch": 1.78, "learning_rate": 3.305442044496335e-05, "loss": 0.007, "step": 164620 }, { "epoch": 1.78, "learning_rate": 3.303820457936044e-05, "loss": 0.0066, "step": 164630 }, { "epoch": 1.78, "learning_rate": 3.302198871375754e-05, "loss": 0.0054, "step": 164640 }, { "epoch": 1.78, "learning_rate": 3.3005772848154634e-05, "loss": 0.0053, "step": 164650 }, { "epoch": 1.78, "learning_rate": 3.298955698255173e-05, "loss": 0.0063, "step": 164660 }, { "epoch": 1.78, "learning_rate": 3.297334111694882e-05, "loss": 0.0079, "step": 164670 }, { "epoch": 1.78, "learning_rate": 3.295712525134591e-05, "loss": 0.006, "step": 164680 }, { "epoch": 1.78, "learning_rate": 3.2940909385743005e-05, "loss": 0.0064, "step": 164690 }, { "epoch": 1.78, "learning_rate": 3.2924693520140105e-05, "loss": 0.0066, "step": 164700 }, { "epoch": 1.78, "learning_rate": 3.29084776545372e-05, "loss": 0.0071, "step": 164710 }, { "epoch": 1.78, "learning_rate": 3.289226178893429e-05, "loss": 0.0057, "step": 164720 }, { "epoch": 1.78, "learning_rate": 3.287604592333138e-05, "loss": 0.0071, "step": 164730 }, { "epoch": 1.78, "learning_rate": 3.2859830057728476e-05, "loss": 0.0062, "step": 164740 }, { "epoch": 1.78, "learning_rate": 3.2843614192125575e-05, "loss": 0.0091, "step": 164750 }, { "epoch": 1.78, "learning_rate": 3.282739832652267e-05, "loss": 0.0065, "step": 164760 }, { "epoch": 1.78, "learning_rate": 3.281118246091976e-05, "loss": 0.0079, "step": 164770 }, { "epoch": 1.78, "learning_rate": 3.279496659531685e-05, "loss": 0.0056, "step": 164780 }, { "epoch": 1.78, "learning_rate": 3.2778750729713946e-05, "loss": 0.0042, "step": 164790 }, { "epoch": 1.78, "learning_rate": 3.2762534864111046e-05, "loss": 0.0075, "step": 164800 }, { "epoch": 1.78, "learning_rate": 3.274631899850814e-05, "loss": 0.0077, "step": 164810 }, { "epoch": 1.78, "learning_rate": 3.273010313290523e-05, "loss": 0.0071, "step": 164820 }, { "epoch": 1.78, "learning_rate": 3.2713887267302324e-05, "loss": 0.0054, "step": 164830 }, { "epoch": 1.78, "learning_rate": 3.2697671401699417e-05, "loss": 0.0085, "step": 164840 }, { "epoch": 1.78, "learning_rate": 3.268145553609651e-05, "loss": 0.0076, "step": 164850 }, { "epoch": 1.78, "learning_rate": 3.266523967049361e-05, "loss": 0.0076, "step": 164860 }, { "epoch": 1.78, "learning_rate": 3.26490238048907e-05, "loss": 0.0056, "step": 164870 }, { "epoch": 1.78, "learning_rate": 3.2632807939287794e-05, "loss": 0.0101, "step": 164880 }, { "epoch": 1.78, "learning_rate": 3.261659207368489e-05, "loss": 0.0057, "step": 164890 }, { "epoch": 1.78, "learning_rate": 3.2600376208081987e-05, "loss": 0.0069, "step": 164900 }, { "epoch": 1.78, "learning_rate": 3.258416034247908e-05, "loss": 0.0052, "step": 164910 }, { "epoch": 1.78, "learning_rate": 3.256794447687617e-05, "loss": 0.0062, "step": 164920 }, { "epoch": 1.78, "learning_rate": 3.255172861127327e-05, "loss": 0.0079, "step": 164930 }, { "epoch": 1.78, "learning_rate": 3.2535512745670364e-05, "loss": 0.0057, "step": 164940 }, { "epoch": 1.78, "learning_rate": 3.251929688006746e-05, "loss": 0.0068, "step": 164950 }, { "epoch": 1.78, "learning_rate": 3.250308101446455e-05, "loss": 0.0078, "step": 164960 }, { "epoch": 1.78, "learning_rate": 3.248686514886164e-05, "loss": 0.0062, "step": 164970 }, { "epoch": 1.78, "learning_rate": 3.2470649283258735e-05, "loss": 0.0077, "step": 164980 }, { "epoch": 1.78, "learning_rate": 3.2454433417655835e-05, "loss": 0.0057, "step": 164990 }, { "epoch": 1.78, "learning_rate": 3.243821755205293e-05, "loss": 0.0075, "step": 165000 }, { "epoch": 1.78, "eval_cer": 0.9215251973031615, "eval_loss": 0.005625674035400152, "eval_runtime": 121.2135, "eval_samples_per_second": 16.5, "eval_steps_per_second": 4.125, "step": 165000 }, { "epoch": 1.78, "learning_rate": 3.242200168645002e-05, "loss": 0.0093, "step": 165010 }, { "epoch": 1.78, "learning_rate": 3.240578582084711e-05, "loss": 0.0081, "step": 165020 }, { "epoch": 1.78, "learning_rate": 3.2389569955244206e-05, "loss": 0.0079, "step": 165030 }, { "epoch": 1.78, "learning_rate": 3.2373354089641305e-05, "loss": 0.0071, "step": 165040 }, { "epoch": 1.78, "learning_rate": 3.23571382240384e-05, "loss": 0.0068, "step": 165050 }, { "epoch": 1.78, "learning_rate": 3.234092235843549e-05, "loss": 0.0072, "step": 165060 }, { "epoch": 1.78, "learning_rate": 3.2324706492832584e-05, "loss": 0.0063, "step": 165070 }, { "epoch": 1.78, "learning_rate": 3.2308490627229676e-05, "loss": 0.0071, "step": 165080 }, { "epoch": 1.78, "learning_rate": 3.2292274761626776e-05, "loss": 0.0053, "step": 165090 }, { "epoch": 1.78, "learning_rate": 3.227605889602387e-05, "loss": 0.0059, "step": 165100 }, { "epoch": 1.78, "learning_rate": 3.225984303042096e-05, "loss": 0.0046, "step": 165110 }, { "epoch": 1.79, "learning_rate": 3.2243627164818054e-05, "loss": 0.0059, "step": 165120 }, { "epoch": 1.79, "learning_rate": 3.222741129921515e-05, "loss": 0.0068, "step": 165130 }, { "epoch": 1.79, "learning_rate": 3.221119543361224e-05, "loss": 0.0051, "step": 165140 }, { "epoch": 1.79, "learning_rate": 3.219497956800934e-05, "loss": 0.006, "step": 165150 }, { "epoch": 1.79, "learning_rate": 3.217876370240643e-05, "loss": 0.0056, "step": 165160 }, { "epoch": 1.79, "learning_rate": 3.2162547836803525e-05, "loss": 0.0066, "step": 165170 }, { "epoch": 1.79, "learning_rate": 3.214633197120062e-05, "loss": 0.0053, "step": 165180 }, { "epoch": 1.79, "learning_rate": 3.213011610559771e-05, "loss": 0.0053, "step": 165190 }, { "epoch": 1.79, "learning_rate": 3.211390023999481e-05, "loss": 0.0073, "step": 165200 }, { "epoch": 1.79, "learning_rate": 3.20976843743919e-05, "loss": 0.0067, "step": 165210 }, { "epoch": 1.79, "learning_rate": 3.2081468508788995e-05, "loss": 0.0072, "step": 165220 }, { "epoch": 1.79, "learning_rate": 3.206525264318609e-05, "loss": 0.0089, "step": 165230 }, { "epoch": 1.79, "learning_rate": 3.204903677758318e-05, "loss": 0.0082, "step": 165240 }, { "epoch": 1.79, "learning_rate": 3.203282091198028e-05, "loss": 0.0076, "step": 165250 }, { "epoch": 1.79, "learning_rate": 3.201660504637737e-05, "loss": 0.0069, "step": 165260 }, { "epoch": 1.79, "learning_rate": 3.2000389180774466e-05, "loss": 0.0064, "step": 165270 }, { "epoch": 1.79, "learning_rate": 3.1984173315171565e-05, "loss": 0.0043, "step": 165280 }, { "epoch": 1.79, "learning_rate": 3.196795744956866e-05, "loss": 0.0076, "step": 165290 }, { "epoch": 1.79, "learning_rate": 3.195174158396575e-05, "loss": 0.0059, "step": 165300 }, { "epoch": 1.79, "learning_rate": 3.193552571836284e-05, "loss": 0.0071, "step": 165310 }, { "epoch": 1.79, "learning_rate": 3.1919309852759936e-05, "loss": 0.0061, "step": 165320 }, { "epoch": 1.79, "learning_rate": 3.1903093987157036e-05, "loss": 0.0085, "step": 165330 }, { "epoch": 1.79, "learning_rate": 3.188687812155413e-05, "loss": 0.0081, "step": 165340 }, { "epoch": 1.79, "learning_rate": 3.187066225595122e-05, "loss": 0.0064, "step": 165350 }, { "epoch": 1.79, "learning_rate": 3.1854446390348314e-05, "loss": 0.0049, "step": 165360 }, { "epoch": 1.79, "learning_rate": 3.1838230524745406e-05, "loss": 0.0089, "step": 165370 }, { "epoch": 1.79, "learning_rate": 3.1822014659142506e-05, "loss": 0.0052, "step": 165380 }, { "epoch": 1.79, "learning_rate": 3.18057987935396e-05, "loss": 0.0079, "step": 165390 }, { "epoch": 1.79, "learning_rate": 3.178958292793669e-05, "loss": 0.0065, "step": 165400 }, { "epoch": 1.79, "learning_rate": 3.1773367062333784e-05, "loss": 0.005, "step": 165410 }, { "epoch": 1.79, "learning_rate": 3.175715119673088e-05, "loss": 0.0061, "step": 165420 }, { "epoch": 1.79, "learning_rate": 3.174093533112797e-05, "loss": 0.0078, "step": 165430 }, { "epoch": 1.79, "learning_rate": 3.172471946552507e-05, "loss": 0.0072, "step": 165440 }, { "epoch": 1.79, "learning_rate": 3.170850359992216e-05, "loss": 0.0075, "step": 165450 }, { "epoch": 1.79, "learning_rate": 3.1692287734319255e-05, "loss": 0.0101, "step": 165460 }, { "epoch": 1.79, "learning_rate": 3.167607186871635e-05, "loss": 0.0056, "step": 165470 }, { "epoch": 1.79, "learning_rate": 3.165985600311344e-05, "loss": 0.0073, "step": 165480 }, { "epoch": 1.79, "learning_rate": 3.164364013751054e-05, "loss": 0.0059, "step": 165490 }, { "epoch": 1.79, "learning_rate": 3.162742427190763e-05, "loss": 0.0082, "step": 165500 }, { "epoch": 1.79, "learning_rate": 3.1611208406304725e-05, "loss": 0.0101, "step": 165510 }, { "epoch": 1.79, "learning_rate": 3.159499254070182e-05, "loss": 0.0066, "step": 165520 }, { "epoch": 1.79, "learning_rate": 3.157877667509891e-05, "loss": 0.0059, "step": 165530 }, { "epoch": 1.79, "learning_rate": 3.156256080949601e-05, "loss": 0.0059, "step": 165540 }, { "epoch": 1.79, "learning_rate": 3.15463449438931e-05, "loss": 0.0068, "step": 165550 }, { "epoch": 1.79, "learning_rate": 3.1530129078290196e-05, "loss": 0.0072, "step": 165560 }, { "epoch": 1.79, "learning_rate": 3.151391321268729e-05, "loss": 0.0076, "step": 165570 }, { "epoch": 1.79, "learning_rate": 3.149769734708438e-05, "loss": 0.0052, "step": 165580 }, { "epoch": 1.79, "learning_rate": 3.1481481481481474e-05, "loss": 0.0048, "step": 165590 }, { "epoch": 1.79, "learning_rate": 3.1465265615878573e-05, "loss": 0.0084, "step": 165600 }, { "epoch": 1.79, "learning_rate": 3.1449049750275666e-05, "loss": 0.0076, "step": 165610 }, { "epoch": 1.79, "learning_rate": 3.1432833884672766e-05, "loss": 0.006, "step": 165620 }, { "epoch": 1.79, "learning_rate": 3.141661801906986e-05, "loss": 0.0078, "step": 165630 }, { "epoch": 1.79, "learning_rate": 3.140040215346695e-05, "loss": 0.0053, "step": 165640 }, { "epoch": 1.79, "learning_rate": 3.1384186287864044e-05, "loss": 0.0066, "step": 165650 }, { "epoch": 1.79, "learning_rate": 3.136797042226114e-05, "loss": 0.0052, "step": 165660 }, { "epoch": 1.79, "learning_rate": 3.1351754556658236e-05, "loss": 0.0066, "step": 165670 }, { "epoch": 1.79, "learning_rate": 3.133553869105533e-05, "loss": 0.008, "step": 165680 }, { "epoch": 1.79, "learning_rate": 3.131932282545242e-05, "loss": 0.0072, "step": 165690 }, { "epoch": 1.79, "learning_rate": 3.1303106959849514e-05, "loss": 0.0062, "step": 165700 }, { "epoch": 1.79, "learning_rate": 3.128689109424661e-05, "loss": 0.0061, "step": 165710 }, { "epoch": 1.79, "learning_rate": 3.12706752286437e-05, "loss": 0.0072, "step": 165720 }, { "epoch": 1.79, "learning_rate": 3.12544593630408e-05, "loss": 0.0081, "step": 165730 }, { "epoch": 1.79, "learning_rate": 3.123824349743789e-05, "loss": 0.0081, "step": 165740 }, { "epoch": 1.79, "learning_rate": 3.1222027631834985e-05, "loss": 0.0063, "step": 165750 }, { "epoch": 1.79, "learning_rate": 3.120581176623208e-05, "loss": 0.0073, "step": 165760 }, { "epoch": 1.79, "learning_rate": 3.118959590062917e-05, "loss": 0.0082, "step": 165770 }, { "epoch": 1.79, "learning_rate": 3.117338003502627e-05, "loss": 0.0069, "step": 165780 }, { "epoch": 1.79, "learning_rate": 3.115716416942336e-05, "loss": 0.0056, "step": 165790 }, { "epoch": 1.79, "learning_rate": 3.1140948303820455e-05, "loss": 0.007, "step": 165800 }, { "epoch": 1.79, "learning_rate": 3.112473243821755e-05, "loss": 0.0061, "step": 165810 }, { "epoch": 1.79, "learning_rate": 3.110851657261464e-05, "loss": 0.0063, "step": 165820 }, { "epoch": 1.79, "learning_rate": 3.109230070701174e-05, "loss": 0.0051, "step": 165830 }, { "epoch": 1.79, "learning_rate": 3.107608484140883e-05, "loss": 0.0066, "step": 165840 }, { "epoch": 1.79, "learning_rate": 3.1059868975805926e-05, "loss": 0.0062, "step": 165850 }, { "epoch": 1.79, "learning_rate": 3.104365311020302e-05, "loss": 0.0066, "step": 165860 }, { "epoch": 1.79, "learning_rate": 3.102743724460011e-05, "loss": 0.0089, "step": 165870 }, { "epoch": 1.79, "learning_rate": 3.1011221378997204e-05, "loss": 0.0083, "step": 165880 }, { "epoch": 1.79, "learning_rate": 3.0995005513394304e-05, "loss": 0.0067, "step": 165890 }, { "epoch": 1.79, "learning_rate": 3.0978789647791396e-05, "loss": 0.0065, "step": 165900 }, { "epoch": 1.79, "learning_rate": 3.096257378218849e-05, "loss": 0.0056, "step": 165910 }, { "epoch": 1.79, "learning_rate": 3.094635791658558e-05, "loss": 0.0079, "step": 165920 }, { "epoch": 1.79, "learning_rate": 3.0930142050982675e-05, "loss": 0.0079, "step": 165930 }, { "epoch": 1.79, "learning_rate": 3.0913926185379774e-05, "loss": 0.007, "step": 165940 }, { "epoch": 1.79, "learning_rate": 3.089771031977687e-05, "loss": 0.0061, "step": 165950 }, { "epoch": 1.79, "learning_rate": 3.088149445417396e-05, "loss": 0.0061, "step": 165960 }, { "epoch": 1.79, "learning_rate": 3.086527858857105e-05, "loss": 0.0077, "step": 165970 }, { "epoch": 1.79, "learning_rate": 3.084906272296815e-05, "loss": 0.0063, "step": 165980 }, { "epoch": 1.79, "learning_rate": 3.0832846857365245e-05, "loss": 0.007, "step": 165990 }, { "epoch": 1.79, "learning_rate": 3.081663099176234e-05, "loss": 0.0067, "step": 166000 }, { "epoch": 1.79, "eval_cer": 0.9215173798765541, "eval_loss": 0.005517047364264727, "eval_runtime": 121.2305, "eval_samples_per_second": 16.497, "eval_steps_per_second": 4.124, "step": 166000 }, { "epoch": 1.79, "learning_rate": 3.080041512615943e-05, "loss": 0.0067, "step": 166010 }, { "epoch": 1.79, "learning_rate": 3.078419926055653e-05, "loss": 0.0067, "step": 166020 }, { "epoch": 1.79, "learning_rate": 3.076798339495362e-05, "loss": 0.0067, "step": 166030 }, { "epoch": 1.79, "learning_rate": 3.0751767529350715e-05, "loss": 0.0071, "step": 166040 }, { "epoch": 1.8, "learning_rate": 3.073555166374781e-05, "loss": 0.0073, "step": 166050 }, { "epoch": 1.8, "learning_rate": 3.07193357981449e-05, "loss": 0.0069, "step": 166060 }, { "epoch": 1.8, "learning_rate": 3.0703119932542e-05, "loss": 0.008, "step": 166070 }, { "epoch": 1.8, "learning_rate": 3.068690406693909e-05, "loss": 0.0082, "step": 166080 }, { "epoch": 1.8, "learning_rate": 3.0670688201336186e-05, "loss": 0.006, "step": 166090 }, { "epoch": 1.8, "learning_rate": 3.065447233573328e-05, "loss": 0.0056, "step": 166100 }, { "epoch": 1.8, "learning_rate": 3.063825647013037e-05, "loss": 0.0075, "step": 166110 }, { "epoch": 1.8, "learning_rate": 3.062204060452747e-05, "loss": 0.0056, "step": 166120 }, { "epoch": 1.8, "learning_rate": 3.0605824738924563e-05, "loss": 0.0092, "step": 166130 }, { "epoch": 1.8, "learning_rate": 3.0589608873321656e-05, "loss": 0.0056, "step": 166140 }, { "epoch": 1.8, "learning_rate": 3.057339300771875e-05, "loss": 0.0061, "step": 166150 }, { "epoch": 1.8, "learning_rate": 3.055717714211584e-05, "loss": 0.0062, "step": 166160 }, { "epoch": 1.8, "learning_rate": 3.0540961276512934e-05, "loss": 0.006, "step": 166170 }, { "epoch": 1.8, "learning_rate": 3.0524745410910034e-05, "loss": 0.0052, "step": 166180 }, { "epoch": 1.8, "learning_rate": 3.0508529545307127e-05, "loss": 0.0069, "step": 166190 }, { "epoch": 1.8, "learning_rate": 3.049231367970422e-05, "loss": 0.0096, "step": 166200 }, { "epoch": 1.8, "learning_rate": 3.0476097814101312e-05, "loss": 0.0065, "step": 166210 }, { "epoch": 1.8, "learning_rate": 3.0459881948498408e-05, "loss": 0.009, "step": 166220 }, { "epoch": 1.8, "learning_rate": 3.04436660828955e-05, "loss": 0.0056, "step": 166230 }, { "epoch": 1.8, "learning_rate": 3.0427450217292597e-05, "loss": 0.0083, "step": 166240 }, { "epoch": 1.8, "learning_rate": 3.041123435168969e-05, "loss": 0.0051, "step": 166250 }, { "epoch": 1.8, "learning_rate": 3.0395018486086783e-05, "loss": 0.0081, "step": 166260 }, { "epoch": 1.8, "learning_rate": 3.037880262048388e-05, "loss": 0.0069, "step": 166270 }, { "epoch": 1.8, "learning_rate": 3.036258675488097e-05, "loss": 0.0068, "step": 166280 }, { "epoch": 1.8, "learning_rate": 3.0346370889278064e-05, "loss": 0.0076, "step": 166290 }, { "epoch": 1.8, "learning_rate": 3.033015502367516e-05, "loss": 0.0056, "step": 166300 }, { "epoch": 1.8, "learning_rate": 3.0313939158072253e-05, "loss": 0.0082, "step": 166310 }, { "epoch": 1.8, "learning_rate": 3.0297723292469346e-05, "loss": 0.0068, "step": 166320 }, { "epoch": 1.8, "learning_rate": 3.0281507426866442e-05, "loss": 0.0061, "step": 166330 }, { "epoch": 1.8, "learning_rate": 3.0265291561263538e-05, "loss": 0.0055, "step": 166340 }, { "epoch": 1.8, "learning_rate": 3.0249075695660634e-05, "loss": 0.0056, "step": 166350 }, { "epoch": 1.8, "learning_rate": 3.0232859830057727e-05, "loss": 0.0063, "step": 166360 }, { "epoch": 1.8, "learning_rate": 3.0216643964454823e-05, "loss": 0.0078, "step": 166370 }, { "epoch": 1.8, "learning_rate": 3.0200428098851916e-05, "loss": 0.005, "step": 166380 }, { "epoch": 1.8, "learning_rate": 3.018421223324901e-05, "loss": 0.0086, "step": 166390 }, { "epoch": 1.8, "learning_rate": 3.0167996367646105e-05, "loss": 0.0062, "step": 166400 }, { "epoch": 1.8, "learning_rate": 3.0151780502043198e-05, "loss": 0.0057, "step": 166410 }, { "epoch": 1.8, "learning_rate": 3.013556463644029e-05, "loss": 0.0048, "step": 166420 }, { "epoch": 1.8, "learning_rate": 3.0119348770837386e-05, "loss": 0.0068, "step": 166430 }, { "epoch": 1.8, "learning_rate": 3.010313290523448e-05, "loss": 0.0073, "step": 166440 }, { "epoch": 1.8, "learning_rate": 3.0086917039631575e-05, "loss": 0.0061, "step": 166450 }, { "epoch": 1.8, "learning_rate": 3.0070701174028668e-05, "loss": 0.0081, "step": 166460 }, { "epoch": 1.8, "learning_rate": 3.005448530842576e-05, "loss": 0.007, "step": 166470 }, { "epoch": 1.8, "learning_rate": 3.0038269442822857e-05, "loss": 0.0065, "step": 166480 }, { "epoch": 1.8, "learning_rate": 3.002205357721995e-05, "loss": 0.0061, "step": 166490 }, { "epoch": 1.8, "learning_rate": 3.0005837711617042e-05, "loss": 0.0069, "step": 166500 }, { "epoch": 1.8, "learning_rate": 2.998962184601414e-05, "loss": 0.0063, "step": 166510 }, { "epoch": 1.8, "learning_rate": 2.997340598041123e-05, "loss": 0.0069, "step": 166520 }, { "epoch": 1.8, "learning_rate": 2.9957190114808327e-05, "loss": 0.0061, "step": 166530 }, { "epoch": 1.8, "learning_rate": 2.994097424920542e-05, "loss": 0.0065, "step": 166540 }, { "epoch": 1.8, "learning_rate": 2.9924758383602513e-05, "loss": 0.0089, "step": 166550 }, { "epoch": 1.8, "learning_rate": 2.990854251799961e-05, "loss": 0.006, "step": 166560 }, { "epoch": 1.8, "learning_rate": 2.9892326652396702e-05, "loss": 0.0071, "step": 166570 }, { "epoch": 1.8, "learning_rate": 2.9876110786793794e-05, "loss": 0.0061, "step": 166580 }, { "epoch": 1.8, "learning_rate": 2.985989492119089e-05, "loss": 0.0059, "step": 166590 }, { "epoch": 1.8, "learning_rate": 2.9843679055587983e-05, "loss": 0.0088, "step": 166600 }, { "epoch": 1.8, "learning_rate": 2.9827463189985076e-05, "loss": 0.0071, "step": 166610 }, { "epoch": 1.8, "learning_rate": 2.9811247324382172e-05, "loss": 0.006, "step": 166620 }, { "epoch": 1.8, "learning_rate": 2.9795031458779265e-05, "loss": 0.0056, "step": 166630 }, { "epoch": 1.8, "learning_rate": 2.977881559317636e-05, "loss": 0.006, "step": 166640 }, { "epoch": 1.8, "learning_rate": 2.9762599727573454e-05, "loss": 0.0057, "step": 166650 }, { "epoch": 1.8, "learning_rate": 2.9746383861970547e-05, "loss": 0.0081, "step": 166660 }, { "epoch": 1.8, "learning_rate": 2.9730167996367643e-05, "loss": 0.0064, "step": 166670 }, { "epoch": 1.8, "learning_rate": 2.9713952130764735e-05, "loss": 0.0053, "step": 166680 }, { "epoch": 1.8, "learning_rate": 2.9697736265161828e-05, "loss": 0.0048, "step": 166690 }, { "epoch": 1.8, "learning_rate": 2.9681520399558928e-05, "loss": 0.0059, "step": 166700 }, { "epoch": 1.8, "learning_rate": 2.966530453395602e-05, "loss": 0.0059, "step": 166710 }, { "epoch": 1.8, "learning_rate": 2.9649088668353117e-05, "loss": 0.0074, "step": 166720 }, { "epoch": 1.8, "learning_rate": 2.963287280275021e-05, "loss": 0.006, "step": 166730 }, { "epoch": 1.8, "learning_rate": 2.9616656937147305e-05, "loss": 0.0069, "step": 166740 }, { "epoch": 1.8, "learning_rate": 2.9600441071544398e-05, "loss": 0.0067, "step": 166750 }, { "epoch": 1.8, "learning_rate": 2.958422520594149e-05, "loss": 0.0063, "step": 166760 }, { "epoch": 1.8, "learning_rate": 2.9568009340338587e-05, "loss": 0.0069, "step": 166770 }, { "epoch": 1.8, "learning_rate": 2.955179347473568e-05, "loss": 0.0071, "step": 166780 }, { "epoch": 1.8, "learning_rate": 2.9535577609132773e-05, "loss": 0.0094, "step": 166790 }, { "epoch": 1.8, "learning_rate": 2.951936174352987e-05, "loss": 0.0062, "step": 166800 }, { "epoch": 1.8, "learning_rate": 2.950314587792696e-05, "loss": 0.007, "step": 166810 }, { "epoch": 1.8, "learning_rate": 2.9486930012324058e-05, "loss": 0.0074, "step": 166820 }, { "epoch": 1.8, "learning_rate": 2.947071414672115e-05, "loss": 0.0072, "step": 166830 }, { "epoch": 1.8, "learning_rate": 2.9454498281118243e-05, "loss": 0.0063, "step": 166840 }, { "epoch": 1.8, "learning_rate": 2.943828241551534e-05, "loss": 0.0058, "step": 166850 }, { "epoch": 1.8, "learning_rate": 2.9422066549912432e-05, "loss": 0.0083, "step": 166860 }, { "epoch": 1.8, "learning_rate": 2.9405850684309525e-05, "loss": 0.0072, "step": 166870 }, { "epoch": 1.8, "learning_rate": 2.938963481870662e-05, "loss": 0.0063, "step": 166880 }, { "epoch": 1.8, "learning_rate": 2.9373418953103714e-05, "loss": 0.0072, "step": 166890 }, { "epoch": 1.8, "learning_rate": 2.9357203087500806e-05, "loss": 0.0057, "step": 166900 }, { "epoch": 1.8, "learning_rate": 2.9340987221897902e-05, "loss": 0.0093, "step": 166910 }, { "epoch": 1.8, "learning_rate": 2.9324771356294995e-05, "loss": 0.0073, "step": 166920 }, { "epoch": 1.8, "learning_rate": 2.930855549069209e-05, "loss": 0.0081, "step": 166930 }, { "epoch": 1.8, "learning_rate": 2.9292339625089184e-05, "loss": 0.0071, "step": 166940 }, { "epoch": 1.8, "learning_rate": 2.9276123759486277e-05, "loss": 0.0047, "step": 166950 }, { "epoch": 1.8, "learning_rate": 2.9259907893883373e-05, "loss": 0.0075, "step": 166960 }, { "epoch": 1.81, "learning_rate": 2.9243692028280466e-05, "loss": 0.0055, "step": 166970 }, { "epoch": 1.81, "learning_rate": 2.922747616267756e-05, "loss": 0.0068, "step": 166980 }, { "epoch": 1.81, "learning_rate": 2.9211260297074655e-05, "loss": 0.0062, "step": 166990 }, { "epoch": 1.81, "learning_rate": 2.9195044431471747e-05, "loss": 0.0069, "step": 167000 }, { "epoch": 1.81, "eval_cer": 0.9215278031120306, "eval_loss": 0.0055626993998885155, "eval_runtime": 121.1369, "eval_samples_per_second": 16.51, "eval_steps_per_second": 4.128, "step": 167000 }, { "epoch": 1.81, "learning_rate": 2.9178828565868843e-05, "loss": 0.0062, "step": 167010 }, { "epoch": 1.81, "learning_rate": 2.9162612700265936e-05, "loss": 0.008, "step": 167020 }, { "epoch": 1.81, "learning_rate": 2.914639683466303e-05, "loss": 0.0051, "step": 167030 }, { "epoch": 1.81, "learning_rate": 2.9130180969060125e-05, "loss": 0.0071, "step": 167040 }, { "epoch": 1.81, "learning_rate": 2.9113965103457218e-05, "loss": 0.007, "step": 167050 }, { "epoch": 1.81, "learning_rate": 2.9097749237854317e-05, "loss": 0.0062, "step": 167060 }, { "epoch": 1.81, "learning_rate": 2.908153337225141e-05, "loss": 0.0072, "step": 167070 }, { "epoch": 1.81, "learning_rate": 2.9065317506648503e-05, "loss": 0.0071, "step": 167080 }, { "epoch": 1.81, "learning_rate": 2.90491016410456e-05, "loss": 0.0074, "step": 167090 }, { "epoch": 1.81, "learning_rate": 2.903288577544269e-05, "loss": 0.0053, "step": 167100 }, { "epoch": 1.81, "learning_rate": 2.9016669909839788e-05, "loss": 0.0046, "step": 167110 }, { "epoch": 1.81, "learning_rate": 2.900045404423688e-05, "loss": 0.007, "step": 167120 }, { "epoch": 1.81, "learning_rate": 2.8984238178633973e-05, "loss": 0.0062, "step": 167130 }, { "epoch": 1.81, "learning_rate": 2.896802231303107e-05, "loss": 0.0065, "step": 167140 }, { "epoch": 1.81, "learning_rate": 2.8951806447428162e-05, "loss": 0.0056, "step": 167150 }, { "epoch": 1.81, "learning_rate": 2.8935590581825255e-05, "loss": 0.0049, "step": 167160 }, { "epoch": 1.81, "learning_rate": 2.891937471622235e-05, "loss": 0.009, "step": 167170 }, { "epoch": 1.81, "learning_rate": 2.8903158850619444e-05, "loss": 0.0068, "step": 167180 }, { "epoch": 1.81, "learning_rate": 2.8886942985016537e-05, "loss": 0.007, "step": 167190 }, { "epoch": 1.81, "learning_rate": 2.8870727119413633e-05, "loss": 0.0061, "step": 167200 }, { "epoch": 1.81, "learning_rate": 2.8854511253810725e-05, "loss": 0.0062, "step": 167210 }, { "epoch": 1.81, "learning_rate": 2.883829538820782e-05, "loss": 0.0079, "step": 167220 }, { "epoch": 1.81, "learning_rate": 2.8822079522604914e-05, "loss": 0.0064, "step": 167230 }, { "epoch": 1.81, "learning_rate": 2.8805863657002007e-05, "loss": 0.0079, "step": 167240 }, { "epoch": 1.81, "learning_rate": 2.8789647791399103e-05, "loss": 0.0058, "step": 167250 }, { "epoch": 1.81, "learning_rate": 2.8773431925796196e-05, "loss": 0.0066, "step": 167260 }, { "epoch": 1.81, "learning_rate": 2.875721606019329e-05, "loss": 0.0091, "step": 167270 }, { "epoch": 1.81, "learning_rate": 2.8741000194590385e-05, "loss": 0.005, "step": 167280 }, { "epoch": 1.81, "learning_rate": 2.8724784328987478e-05, "loss": 0.0063, "step": 167290 }, { "epoch": 1.81, "learning_rate": 2.8708568463384574e-05, "loss": 0.0072, "step": 167300 }, { "epoch": 1.81, "learning_rate": 2.8692352597781666e-05, "loss": 0.0073, "step": 167310 }, { "epoch": 1.81, "learning_rate": 2.867613673217876e-05, "loss": 0.0055, "step": 167320 }, { "epoch": 1.81, "learning_rate": 2.8659920866575855e-05, "loss": 0.0053, "step": 167330 }, { "epoch": 1.81, "learning_rate": 2.8643705000972948e-05, "loss": 0.0056, "step": 167340 }, { "epoch": 1.81, "learning_rate": 2.862748913537004e-05, "loss": 0.0087, "step": 167350 }, { "epoch": 1.81, "learning_rate": 2.8611273269767137e-05, "loss": 0.0069, "step": 167360 }, { "epoch": 1.81, "learning_rate": 2.859505740416423e-05, "loss": 0.0073, "step": 167370 }, { "epoch": 1.81, "learning_rate": 2.8578841538561326e-05, "loss": 0.0069, "step": 167380 }, { "epoch": 1.81, "learning_rate": 2.856262567295842e-05, "loss": 0.0065, "step": 167390 }, { "epoch": 1.81, "learning_rate": 2.854640980735551e-05, "loss": 0.0064, "step": 167400 }, { "epoch": 1.81, "learning_rate": 2.8530193941752607e-05, "loss": 0.0053, "step": 167410 }, { "epoch": 1.81, "learning_rate": 2.8513978076149704e-05, "loss": 0.0062, "step": 167420 }, { "epoch": 1.81, "learning_rate": 2.84977622105468e-05, "loss": 0.0087, "step": 167430 }, { "epoch": 1.81, "learning_rate": 2.8481546344943892e-05, "loss": 0.0084, "step": 167440 }, { "epoch": 1.81, "learning_rate": 2.8465330479340985e-05, "loss": 0.0058, "step": 167450 }, { "epoch": 1.81, "learning_rate": 2.844911461373808e-05, "loss": 0.0078, "step": 167460 }, { "epoch": 1.81, "learning_rate": 2.8432898748135174e-05, "loss": 0.0075, "step": 167470 }, { "epoch": 1.81, "learning_rate": 2.841668288253227e-05, "loss": 0.0086, "step": 167480 }, { "epoch": 1.81, "learning_rate": 2.8400467016929363e-05, "loss": 0.0052, "step": 167490 }, { "epoch": 1.81, "learning_rate": 2.8384251151326456e-05, "loss": 0.0046, "step": 167500 }, { "epoch": 1.81, "learning_rate": 2.8368035285723552e-05, "loss": 0.0061, "step": 167510 }, { "epoch": 1.81, "learning_rate": 2.8351819420120644e-05, "loss": 0.0065, "step": 167520 }, { "epoch": 1.81, "learning_rate": 2.8335603554517737e-05, "loss": 0.0049, "step": 167530 }, { "epoch": 1.81, "learning_rate": 2.8319387688914833e-05, "loss": 0.007, "step": 167540 }, { "epoch": 1.81, "learning_rate": 2.8303171823311926e-05, "loss": 0.0072, "step": 167550 }, { "epoch": 1.81, "learning_rate": 2.828695595770902e-05, "loss": 0.0058, "step": 167560 }, { "epoch": 1.81, "learning_rate": 2.8270740092106115e-05, "loss": 0.0061, "step": 167570 }, { "epoch": 1.81, "learning_rate": 2.8254524226503208e-05, "loss": 0.006, "step": 167580 }, { "epoch": 1.81, "learning_rate": 2.8238308360900304e-05, "loss": 0.0058, "step": 167590 }, { "epoch": 1.81, "learning_rate": 2.8222092495297397e-05, "loss": 0.0068, "step": 167600 }, { "epoch": 1.81, "learning_rate": 2.820587662969449e-05, "loss": 0.0057, "step": 167610 }, { "epoch": 1.81, "learning_rate": 2.8189660764091585e-05, "loss": 0.0061, "step": 167620 }, { "epoch": 1.81, "learning_rate": 2.8173444898488678e-05, "loss": 0.007, "step": 167630 }, { "epoch": 1.81, "learning_rate": 2.815722903288577e-05, "loss": 0.0056, "step": 167640 }, { "epoch": 1.81, "learning_rate": 2.8141013167282867e-05, "loss": 0.0079, "step": 167650 }, { "epoch": 1.81, "learning_rate": 2.812479730167996e-05, "loss": 0.0052, "step": 167660 }, { "epoch": 1.81, "learning_rate": 2.8108581436077056e-05, "loss": 0.0055, "step": 167670 }, { "epoch": 1.81, "learning_rate": 2.809236557047415e-05, "loss": 0.0057, "step": 167680 }, { "epoch": 1.81, "learning_rate": 2.807614970487124e-05, "loss": 0.0079, "step": 167690 }, { "epoch": 1.81, "learning_rate": 2.8059933839268338e-05, "loss": 0.0095, "step": 167700 }, { "epoch": 1.81, "learning_rate": 2.804371797366543e-05, "loss": 0.0063, "step": 167710 }, { "epoch": 1.81, "learning_rate": 2.8027502108062523e-05, "loss": 0.0074, "step": 167720 }, { "epoch": 1.81, "learning_rate": 2.801128624245962e-05, "loss": 0.0075, "step": 167730 }, { "epoch": 1.81, "learning_rate": 2.7995070376856712e-05, "loss": 0.0069, "step": 167740 }, { "epoch": 1.81, "learning_rate": 2.7978854511253808e-05, "loss": 0.0047, "step": 167750 }, { "epoch": 1.81, "learning_rate": 2.79626386456509e-05, "loss": 0.0063, "step": 167760 }, { "epoch": 1.81, "learning_rate": 2.7946422780047994e-05, "loss": 0.0063, "step": 167770 }, { "epoch": 1.81, "learning_rate": 2.7930206914445093e-05, "loss": 0.0064, "step": 167780 }, { "epoch": 1.81, "learning_rate": 2.7913991048842186e-05, "loss": 0.005, "step": 167790 }, { "epoch": 1.81, "learning_rate": 2.7897775183239282e-05, "loss": 0.0067, "step": 167800 }, { "epoch": 1.81, "learning_rate": 2.7881559317636375e-05, "loss": 0.0067, "step": 167810 }, { "epoch": 1.81, "learning_rate": 2.7865343452033467e-05, "loss": 0.0072, "step": 167820 }, { "epoch": 1.81, "learning_rate": 2.7849127586430564e-05, "loss": 0.0054, "step": 167830 }, { "epoch": 1.81, "learning_rate": 2.7832911720827656e-05, "loss": 0.005, "step": 167840 }, { "epoch": 1.81, "learning_rate": 2.781669585522475e-05, "loss": 0.0061, "step": 167850 }, { "epoch": 1.81, "learning_rate": 2.7800479989621845e-05, "loss": 0.0056, "step": 167860 }, { "epoch": 1.81, "learning_rate": 2.7784264124018938e-05, "loss": 0.0059, "step": 167870 }, { "epoch": 1.81, "learning_rate": 2.7768048258416034e-05, "loss": 0.0059, "step": 167880 }, { "epoch": 1.81, "learning_rate": 2.7751832392813127e-05, "loss": 0.0068, "step": 167890 }, { "epoch": 1.82, "learning_rate": 2.773561652721022e-05, "loss": 0.0057, "step": 167900 }, { "epoch": 1.82, "learning_rate": 2.7719400661607316e-05, "loss": 0.007, "step": 167910 }, { "epoch": 1.82, "learning_rate": 2.770318479600441e-05, "loss": 0.007, "step": 167920 }, { "epoch": 1.82, "learning_rate": 2.76869689304015e-05, "loss": 0.0052, "step": 167930 }, { "epoch": 1.82, "learning_rate": 2.7670753064798597e-05, "loss": 0.0044, "step": 167940 }, { "epoch": 1.82, "learning_rate": 2.765453719919569e-05, "loss": 0.0099, "step": 167950 }, { "epoch": 1.82, "learning_rate": 2.7638321333592786e-05, "loss": 0.0063, "step": 167960 }, { "epoch": 1.82, "learning_rate": 2.762210546798988e-05, "loss": 0.0044, "step": 167970 }, { "epoch": 1.82, "learning_rate": 2.760588960238697e-05, "loss": 0.0051, "step": 167980 }, { "epoch": 1.82, "learning_rate": 2.7589673736784068e-05, "loss": 0.0067, "step": 167990 }, { "epoch": 1.82, "learning_rate": 2.757345787118116e-05, "loss": 0.0063, "step": 168000 }, { "epoch": 1.82, "eval_cer": 0.9215182484795105, "eval_loss": 0.005569620057940483, "eval_runtime": 121.2406, "eval_samples_per_second": 16.496, "eval_steps_per_second": 4.124, "step": 168000 }, { "epoch": 1.82, "learning_rate": 2.7557242005578253e-05, "loss": 0.0068, "step": 168010 }, { "epoch": 1.82, "learning_rate": 2.754102613997535e-05, "loss": 0.0071, "step": 168020 }, { "epoch": 1.82, "learning_rate": 2.7524810274372442e-05, "loss": 0.0069, "step": 168030 }, { "epoch": 1.82, "learning_rate": 2.7508594408769538e-05, "loss": 0.0067, "step": 168040 }, { "epoch": 1.82, "learning_rate": 2.749237854316663e-05, "loss": 0.0055, "step": 168050 }, { "epoch": 1.82, "learning_rate": 2.7476162677563724e-05, "loss": 0.0056, "step": 168060 }, { "epoch": 1.82, "learning_rate": 2.745994681196082e-05, "loss": 0.0053, "step": 168070 }, { "epoch": 1.82, "learning_rate": 2.7443730946357913e-05, "loss": 0.0072, "step": 168080 }, { "epoch": 1.82, "learning_rate": 2.7427515080755005e-05, "loss": 0.0065, "step": 168090 }, { "epoch": 1.82, "learning_rate": 2.74112992151521e-05, "loss": 0.0093, "step": 168100 }, { "epoch": 1.82, "learning_rate": 2.7395083349549194e-05, "loss": 0.0053, "step": 168110 }, { "epoch": 1.82, "learning_rate": 2.737886748394629e-05, "loss": 0.0072, "step": 168120 }, { "epoch": 1.82, "learning_rate": 2.7362651618343383e-05, "loss": 0.0112, "step": 168130 }, { "epoch": 1.82, "learning_rate": 2.734643575274048e-05, "loss": 0.0063, "step": 168140 }, { "epoch": 1.82, "learning_rate": 2.7330219887137575e-05, "loss": 0.0046, "step": 168150 }, { "epoch": 1.82, "learning_rate": 2.7314004021534668e-05, "loss": 0.0058, "step": 168160 }, { "epoch": 1.82, "learning_rate": 2.7297788155931764e-05, "loss": 0.0067, "step": 168170 }, { "epoch": 1.82, "learning_rate": 2.7281572290328857e-05, "loss": 0.0066, "step": 168180 }, { "epoch": 1.82, "learning_rate": 2.726535642472595e-05, "loss": 0.0065, "step": 168190 }, { "epoch": 1.82, "learning_rate": 2.7249140559123046e-05, "loss": 0.0077, "step": 168200 }, { "epoch": 1.82, "learning_rate": 2.723292469352014e-05, "loss": 0.0049, "step": 168210 }, { "epoch": 1.82, "learning_rate": 2.721670882791723e-05, "loss": 0.0081, "step": 168220 }, { "epoch": 1.82, "learning_rate": 2.7200492962314328e-05, "loss": 0.0051, "step": 168230 }, { "epoch": 1.82, "learning_rate": 2.718427709671142e-05, "loss": 0.0059, "step": 168240 }, { "epoch": 1.82, "learning_rate": 2.7168061231108516e-05, "loss": 0.0055, "step": 168250 }, { "epoch": 1.82, "learning_rate": 2.715184536550561e-05, "loss": 0.0052, "step": 168260 }, { "epoch": 1.82, "learning_rate": 2.7135629499902702e-05, "loss": 0.0074, "step": 168270 }, { "epoch": 1.82, "learning_rate": 2.7119413634299798e-05, "loss": 0.0078, "step": 168280 }, { "epoch": 1.82, "learning_rate": 2.710319776869689e-05, "loss": 0.0067, "step": 168290 }, { "epoch": 1.82, "learning_rate": 2.7086981903093984e-05, "loss": 0.005, "step": 168300 }, { "epoch": 1.82, "learning_rate": 2.707076603749108e-05, "loss": 0.007, "step": 168310 }, { "epoch": 1.82, "learning_rate": 2.7054550171888172e-05, "loss": 0.0083, "step": 168320 }, { "epoch": 1.82, "learning_rate": 2.703833430628527e-05, "loss": 0.0077, "step": 168330 }, { "epoch": 1.82, "learning_rate": 2.702211844068236e-05, "loss": 0.0053, "step": 168340 }, { "epoch": 1.82, "learning_rate": 2.7005902575079454e-05, "loss": 0.0087, "step": 168350 }, { "epoch": 1.82, "learning_rate": 2.698968670947655e-05, "loss": 0.0065, "step": 168360 }, { "epoch": 1.82, "learning_rate": 2.6973470843873643e-05, "loss": 0.0096, "step": 168370 }, { "epoch": 1.82, "learning_rate": 2.6957254978270736e-05, "loss": 0.0052, "step": 168380 }, { "epoch": 1.82, "learning_rate": 2.6941039112667832e-05, "loss": 0.0064, "step": 168390 }, { "epoch": 1.82, "learning_rate": 2.6924823247064924e-05, "loss": 0.0077, "step": 168400 }, { "epoch": 1.82, "learning_rate": 2.690860738146202e-05, "loss": 0.0046, "step": 168410 }, { "epoch": 1.82, "learning_rate": 2.6892391515859113e-05, "loss": 0.0069, "step": 168420 }, { "epoch": 1.82, "learning_rate": 2.6876175650256206e-05, "loss": 0.0059, "step": 168430 }, { "epoch": 1.82, "learning_rate": 2.6859959784653302e-05, "loss": 0.0079, "step": 168440 }, { "epoch": 1.82, "learning_rate": 2.6843743919050395e-05, "loss": 0.0082, "step": 168450 }, { "epoch": 1.82, "learning_rate": 2.6827528053447488e-05, "loss": 0.0079, "step": 168460 }, { "epoch": 1.82, "learning_rate": 2.6811312187844584e-05, "loss": 0.0061, "step": 168470 }, { "epoch": 1.82, "learning_rate": 2.6795096322241677e-05, "loss": 0.0065, "step": 168480 }, { "epoch": 1.82, "learning_rate": 2.677888045663877e-05, "loss": 0.0058, "step": 168490 }, { "epoch": 1.82, "learning_rate": 2.676266459103587e-05, "loss": 0.0074, "step": 168500 }, { "epoch": 1.82, "learning_rate": 2.674644872543296e-05, "loss": 0.0048, "step": 168510 }, { "epoch": 1.82, "learning_rate": 2.6730232859830058e-05, "loss": 0.0059, "step": 168520 }, { "epoch": 1.82, "learning_rate": 2.671401699422715e-05, "loss": 0.0071, "step": 168530 }, { "epoch": 1.82, "learning_rate": 2.6697801128624247e-05, "loss": 0.0075, "step": 168540 }, { "epoch": 1.82, "learning_rate": 2.668158526302134e-05, "loss": 0.0064, "step": 168550 }, { "epoch": 1.82, "learning_rate": 2.6665369397418432e-05, "loss": 0.0066, "step": 168560 }, { "epoch": 1.82, "learning_rate": 2.6649153531815528e-05, "loss": 0.0075, "step": 168570 }, { "epoch": 1.82, "learning_rate": 2.663293766621262e-05, "loss": 0.0075, "step": 168580 }, { "epoch": 1.82, "learning_rate": 2.6616721800609714e-05, "loss": 0.0051, "step": 168590 }, { "epoch": 1.82, "learning_rate": 2.660050593500681e-05, "loss": 0.0064, "step": 168600 }, { "epoch": 1.82, "learning_rate": 2.6584290069403903e-05, "loss": 0.0068, "step": 168610 }, { "epoch": 1.82, "learning_rate": 2.6568074203801e-05, "loss": 0.0073, "step": 168620 }, { "epoch": 1.82, "learning_rate": 2.655185833819809e-05, "loss": 0.0053, "step": 168630 }, { "epoch": 1.82, "learning_rate": 2.6535642472595184e-05, "loss": 0.0064, "step": 168640 }, { "epoch": 1.82, "learning_rate": 2.651942660699228e-05, "loss": 0.0086, "step": 168650 }, { "epoch": 1.82, "learning_rate": 2.6503210741389373e-05, "loss": 0.0059, "step": 168660 }, { "epoch": 1.82, "learning_rate": 2.6486994875786466e-05, "loss": 0.0069, "step": 168670 }, { "epoch": 1.82, "learning_rate": 2.6470779010183562e-05, "loss": 0.0082, "step": 168680 }, { "epoch": 1.82, "learning_rate": 2.6454563144580655e-05, "loss": 0.0053, "step": 168690 }, { "epoch": 1.82, "learning_rate": 2.643834727897775e-05, "loss": 0.0058, "step": 168700 }, { "epoch": 1.82, "learning_rate": 2.6422131413374844e-05, "loss": 0.0074, "step": 168710 }, { "epoch": 1.82, "learning_rate": 2.6405915547771936e-05, "loss": 0.0054, "step": 168720 }, { "epoch": 1.82, "learning_rate": 2.6389699682169032e-05, "loss": 0.0061, "step": 168730 }, { "epoch": 1.82, "learning_rate": 2.6373483816566125e-05, "loss": 0.0053, "step": 168740 }, { "epoch": 1.82, "learning_rate": 2.6357267950963218e-05, "loss": 0.0079, "step": 168750 }, { "epoch": 1.82, "learning_rate": 2.6341052085360314e-05, "loss": 0.0067, "step": 168760 }, { "epoch": 1.82, "learning_rate": 2.6324836219757407e-05, "loss": 0.0069, "step": 168770 }, { "epoch": 1.82, "learning_rate": 2.63086203541545e-05, "loss": 0.0066, "step": 168780 }, { "epoch": 1.82, "learning_rate": 2.6292404488551596e-05, "loss": 0.0064, "step": 168790 }, { "epoch": 1.82, "learning_rate": 2.627618862294869e-05, "loss": 0.0052, "step": 168800 }, { "epoch": 1.82, "learning_rate": 2.6259972757345785e-05, "loss": 0.0075, "step": 168810 }, { "epoch": 1.83, "learning_rate": 2.6243756891742877e-05, "loss": 0.006, "step": 168820 }, { "epoch": 1.83, "learning_rate": 2.622754102613997e-05, "loss": 0.0075, "step": 168830 }, { "epoch": 1.83, "learning_rate": 2.6211325160537066e-05, "loss": 0.0051, "step": 168840 }, { "epoch": 1.83, "learning_rate": 2.619510929493416e-05, "loss": 0.0069, "step": 168850 }, { "epoch": 1.83, "learning_rate": 2.617889342933126e-05, "loss": 0.0058, "step": 168860 }, { "epoch": 1.83, "learning_rate": 2.616267756372835e-05, "loss": 0.0066, "step": 168870 }, { "epoch": 1.83, "learning_rate": 2.6146461698125444e-05, "loss": 0.0068, "step": 168880 }, { "epoch": 1.83, "learning_rate": 2.613024583252254e-05, "loss": 0.0059, "step": 168890 }, { "epoch": 1.83, "learning_rate": 2.6114029966919633e-05, "loss": 0.0061, "step": 168900 }, { "epoch": 1.83, "learning_rate": 2.609781410131673e-05, "loss": 0.0066, "step": 168910 }, { "epoch": 1.83, "learning_rate": 2.6081598235713822e-05, "loss": 0.004, "step": 168920 }, { "epoch": 1.83, "learning_rate": 2.6065382370110914e-05, "loss": 0.0078, "step": 168930 }, { "epoch": 1.83, "learning_rate": 2.604916650450801e-05, "loss": 0.0049, "step": 168940 }, { "epoch": 1.83, "learning_rate": 2.6032950638905103e-05, "loss": 0.0077, "step": 168950 }, { "epoch": 1.83, "learning_rate": 2.6016734773302196e-05, "loss": 0.0054, "step": 168960 }, { "epoch": 1.83, "learning_rate": 2.6000518907699292e-05, "loss": 0.0067, "step": 168970 }, { "epoch": 1.83, "learning_rate": 2.5984303042096385e-05, "loss": 0.0077, "step": 168980 }, { "epoch": 1.83, "learning_rate": 2.596808717649348e-05, "loss": 0.0074, "step": 168990 }, { "epoch": 1.83, "learning_rate": 2.5951871310890574e-05, "loss": 0.0058, "step": 169000 }, { "epoch": 1.83, "eval_cer": 0.9215139054647287, "eval_loss": 0.005461297929286957, "eval_runtime": 121.167, "eval_samples_per_second": 16.506, "eval_steps_per_second": 4.127, "step": 169000 }, { "epoch": 1.83, "learning_rate": 2.5935655445287667e-05, "loss": 0.005, "step": 169010 }, { "epoch": 1.83, "learning_rate": 2.5919439579684763e-05, "loss": 0.0074, "step": 169020 }, { "epoch": 1.83, "learning_rate": 2.5903223714081855e-05, "loss": 0.007, "step": 169030 }, { "epoch": 1.83, "learning_rate": 2.5887007848478948e-05, "loss": 0.0058, "step": 169040 }, { "epoch": 1.83, "learning_rate": 2.5870791982876044e-05, "loss": 0.0069, "step": 169050 }, { "epoch": 1.83, "learning_rate": 2.5854576117273137e-05, "loss": 0.0084, "step": 169060 }, { "epoch": 1.83, "learning_rate": 2.5838360251670233e-05, "loss": 0.0104, "step": 169070 }, { "epoch": 1.83, "learning_rate": 2.5822144386067326e-05, "loss": 0.0064, "step": 169080 }, { "epoch": 1.83, "learning_rate": 2.580592852046442e-05, "loss": 0.0059, "step": 169090 }, { "epoch": 1.83, "learning_rate": 2.5789712654861515e-05, "loss": 0.007, "step": 169100 }, { "epoch": 1.83, "learning_rate": 2.5773496789258608e-05, "loss": 0.0083, "step": 169110 }, { "epoch": 1.83, "learning_rate": 2.57572809236557e-05, "loss": 0.0107, "step": 169120 }, { "epoch": 1.83, "learning_rate": 2.5741065058052796e-05, "loss": 0.0068, "step": 169130 }, { "epoch": 1.83, "learning_rate": 2.572484919244989e-05, "loss": 0.0062, "step": 169140 }, { "epoch": 1.83, "learning_rate": 2.5708633326846982e-05, "loss": 0.0058, "step": 169150 }, { "epoch": 1.83, "learning_rate": 2.5692417461244078e-05, "loss": 0.0054, "step": 169160 }, { "epoch": 1.83, "learning_rate": 2.567620159564117e-05, "loss": 0.0083, "step": 169170 }, { "epoch": 1.83, "learning_rate": 2.5659985730038267e-05, "loss": 0.0066, "step": 169180 }, { "epoch": 1.83, "learning_rate": 2.564376986443536e-05, "loss": 0.0049, "step": 169190 }, { "epoch": 1.83, "learning_rate": 2.5627553998832452e-05, "loss": 0.0073, "step": 169200 }, { "epoch": 1.83, "learning_rate": 2.561133813322955e-05, "loss": 0.0079, "step": 169210 }, { "epoch": 1.83, "learning_rate": 2.5595122267626645e-05, "loss": 0.0065, "step": 169220 }, { "epoch": 1.83, "learning_rate": 2.557890640202374e-05, "loss": 0.0057, "step": 169230 }, { "epoch": 1.83, "learning_rate": 2.5562690536420834e-05, "loss": 0.0055, "step": 169240 }, { "epoch": 1.83, "learning_rate": 2.5546474670817926e-05, "loss": 0.0074, "step": 169250 }, { "epoch": 1.83, "learning_rate": 2.5530258805215022e-05, "loss": 0.0064, "step": 169260 }, { "epoch": 1.83, "learning_rate": 2.5514042939612115e-05, "loss": 0.007, "step": 169270 }, { "epoch": 1.83, "learning_rate": 2.549782707400921e-05, "loss": 0.0075, "step": 169280 }, { "epoch": 1.83, "learning_rate": 2.5481611208406304e-05, "loss": 0.0051, "step": 169290 }, { "epoch": 1.83, "learning_rate": 2.5465395342803397e-05, "loss": 0.0075, "step": 169300 }, { "epoch": 1.83, "learning_rate": 2.5449179477200493e-05, "loss": 0.0103, "step": 169310 }, { "epoch": 1.83, "learning_rate": 2.5432963611597586e-05, "loss": 0.0071, "step": 169320 }, { "epoch": 1.83, "learning_rate": 2.541674774599468e-05, "loss": 0.0057, "step": 169330 }, { "epoch": 1.83, "learning_rate": 2.5400531880391775e-05, "loss": 0.007, "step": 169340 }, { "epoch": 1.83, "learning_rate": 2.5384316014788867e-05, "loss": 0.009, "step": 169350 }, { "epoch": 1.83, "learning_rate": 2.5368100149185963e-05, "loss": 0.0064, "step": 169360 }, { "epoch": 1.83, "learning_rate": 2.5351884283583056e-05, "loss": 0.0068, "step": 169370 }, { "epoch": 1.83, "learning_rate": 2.533566841798015e-05, "loss": 0.0079, "step": 169380 }, { "epoch": 1.83, "learning_rate": 2.5319452552377245e-05, "loss": 0.0071, "step": 169390 }, { "epoch": 1.83, "learning_rate": 2.5303236686774338e-05, "loss": 0.0053, "step": 169400 }, { "epoch": 1.83, "learning_rate": 2.528702082117143e-05, "loss": 0.0076, "step": 169410 }, { "epoch": 1.83, "learning_rate": 2.5270804955568527e-05, "loss": 0.006, "step": 169420 }, { "epoch": 1.83, "learning_rate": 2.525458908996562e-05, "loss": 0.0057, "step": 169430 }, { "epoch": 1.83, "learning_rate": 2.5238373224362712e-05, "loss": 0.0049, "step": 169440 }, { "epoch": 1.83, "learning_rate": 2.5222157358759808e-05, "loss": 0.0075, "step": 169450 }, { "epoch": 1.83, "learning_rate": 2.52059414931569e-05, "loss": 0.0053, "step": 169460 }, { "epoch": 1.83, "learning_rate": 2.5189725627553997e-05, "loss": 0.0062, "step": 169470 }, { "epoch": 1.83, "learning_rate": 2.517350976195109e-05, "loss": 0.0053, "step": 169480 }, { "epoch": 1.83, "learning_rate": 2.5157293896348183e-05, "loss": 0.0083, "step": 169490 }, { "epoch": 1.83, "learning_rate": 2.514107803074528e-05, "loss": 0.0053, "step": 169500 }, { "epoch": 1.83, "learning_rate": 2.512486216514237e-05, "loss": 0.0066, "step": 169510 }, { "epoch": 1.83, "learning_rate": 2.5108646299539464e-05, "loss": 0.0077, "step": 169520 }, { "epoch": 1.83, "learning_rate": 2.509243043393656e-05, "loss": 0.0043, "step": 169530 }, { "epoch": 1.83, "learning_rate": 2.5076214568333653e-05, "loss": 0.0059, "step": 169540 }, { "epoch": 1.83, "learning_rate": 2.505999870273075e-05, "loss": 0.0052, "step": 169550 }, { "epoch": 1.83, "learning_rate": 2.5043782837127842e-05, "loss": 0.0054, "step": 169560 }, { "epoch": 1.83, "learning_rate": 2.5027566971524935e-05, "loss": 0.0058, "step": 169570 }, { "epoch": 1.83, "learning_rate": 2.5011351105922034e-05, "loss": 0.0074, "step": 169580 }, { "epoch": 1.83, "learning_rate": 2.4995135240319127e-05, "loss": 0.0048, "step": 169590 }, { "epoch": 1.83, "learning_rate": 2.4978919374716223e-05, "loss": 0.0049, "step": 169600 }, { "epoch": 1.83, "learning_rate": 2.4962703509113316e-05, "loss": 0.0088, "step": 169610 }, { "epoch": 1.83, "learning_rate": 2.494648764351041e-05, "loss": 0.0067, "step": 169620 }, { "epoch": 1.83, "learning_rate": 2.4930271777907505e-05, "loss": 0.0076, "step": 169630 }, { "epoch": 1.83, "learning_rate": 2.4914055912304597e-05, "loss": 0.0089, "step": 169640 }, { "epoch": 1.83, "learning_rate": 2.4897840046701694e-05, "loss": 0.0077, "step": 169650 }, { "epoch": 1.83, "learning_rate": 2.4881624181098786e-05, "loss": 0.0071, "step": 169660 }, { "epoch": 1.83, "learning_rate": 2.486540831549588e-05, "loss": 0.0066, "step": 169670 }, { "epoch": 1.83, "learning_rate": 2.4849192449892975e-05, "loss": 0.0054, "step": 169680 }, { "epoch": 1.83, "learning_rate": 2.4832976584290068e-05, "loss": 0.0084, "step": 169690 }, { "epoch": 1.83, "learning_rate": 2.481676071868716e-05, "loss": 0.0083, "step": 169700 }, { "epoch": 1.83, "learning_rate": 2.4800544853084257e-05, "loss": 0.0072, "step": 169710 }, { "epoch": 1.83, "learning_rate": 2.478432898748135e-05, "loss": 0.0062, "step": 169720 }, { "epoch": 1.83, "learning_rate": 2.4768113121878442e-05, "loss": 0.0051, "step": 169730 }, { "epoch": 1.83, "learning_rate": 2.475189725627554e-05, "loss": 0.0063, "step": 169740 }, { "epoch": 1.84, "learning_rate": 2.473568139067263e-05, "loss": 0.0063, "step": 169750 }, { "epoch": 1.84, "learning_rate": 2.4719465525069727e-05, "loss": 0.0062, "step": 169760 }, { "epoch": 1.84, "learning_rate": 2.470324965946682e-05, "loss": 0.0077, "step": 169770 }, { "epoch": 1.84, "learning_rate": 2.4687033793863913e-05, "loss": 0.0068, "step": 169780 }, { "epoch": 1.84, "learning_rate": 2.467081792826101e-05, "loss": 0.0056, "step": 169790 }, { "epoch": 1.84, "learning_rate": 2.4654602062658102e-05, "loss": 0.0066, "step": 169800 }, { "epoch": 1.84, "learning_rate": 2.4638386197055194e-05, "loss": 0.0055, "step": 169810 }, { "epoch": 1.84, "learning_rate": 2.462217033145229e-05, "loss": 0.0065, "step": 169820 }, { "epoch": 1.84, "learning_rate": 2.4605954465849383e-05, "loss": 0.0067, "step": 169830 }, { "epoch": 1.84, "learning_rate": 2.458973860024648e-05, "loss": 0.007, "step": 169840 }, { "epoch": 1.84, "learning_rate": 2.4573522734643572e-05, "loss": 0.0056, "step": 169850 }, { "epoch": 1.84, "learning_rate": 2.4557306869040665e-05, "loss": 0.0064, "step": 169860 }, { "epoch": 1.84, "learning_rate": 2.454109100343776e-05, "loss": 0.0075, "step": 169870 }, { "epoch": 1.84, "learning_rate": 2.4524875137834854e-05, "loss": 0.0055, "step": 169880 }, { "epoch": 1.84, "learning_rate": 2.4508659272231947e-05, "loss": 0.008, "step": 169890 }, { "epoch": 1.84, "learning_rate": 2.4492443406629043e-05, "loss": 0.0076, "step": 169900 }, { "epoch": 1.84, "learning_rate": 2.4476227541026135e-05, "loss": 0.01, "step": 169910 }, { "epoch": 1.84, "learning_rate": 2.446001167542323e-05, "loss": 0.0049, "step": 169920 }, { "epoch": 1.84, "learning_rate": 2.4443795809820324e-05, "loss": 0.0049, "step": 169930 }, { "epoch": 1.84, "learning_rate": 2.4427579944217424e-05, "loss": 0.0057, "step": 169940 }, { "epoch": 1.84, "learning_rate": 2.4411364078614517e-05, "loss": 0.0078, "step": 169950 }, { "epoch": 1.84, "learning_rate": 2.439514821301161e-05, "loss": 0.007, "step": 169960 }, { "epoch": 1.84, "learning_rate": 2.4378932347408705e-05, "loss": 0.0073, "step": 169970 }, { "epoch": 1.84, "learning_rate": 2.4362716481805798e-05, "loss": 0.0065, "step": 169980 }, { "epoch": 1.84, "learning_rate": 2.434650061620289e-05, "loss": 0.0051, "step": 169990 }, { "epoch": 1.84, "learning_rate": 2.4330284750599987e-05, "loss": 0.0058, "step": 170000 }, { "epoch": 1.84, "eval_cer": 0.9215234600972488, "eval_loss": 0.005428744480013847, "eval_runtime": 121.1672, "eval_samples_per_second": 16.506, "eval_steps_per_second": 4.127, "step": 170000 }, { "epoch": 1.84, "learning_rate": 2.431406888499708e-05, "loss": 0.0068, "step": 170010 }, { "epoch": 1.84, "learning_rate": 2.4297853019394173e-05, "loss": 0.0056, "step": 170020 }, { "epoch": 1.84, "learning_rate": 2.428163715379127e-05, "loss": 0.0079, "step": 170030 }, { "epoch": 1.84, "learning_rate": 2.426542128818836e-05, "loss": 0.0074, "step": 170040 }, { "epoch": 1.84, "learning_rate": 2.4249205422585458e-05, "loss": 0.007, "step": 170050 }, { "epoch": 1.84, "learning_rate": 2.423298955698255e-05, "loss": 0.0058, "step": 170060 }, { "epoch": 1.84, "learning_rate": 2.4216773691379643e-05, "loss": 0.0063, "step": 170070 }, { "epoch": 1.84, "learning_rate": 2.420055782577674e-05, "loss": 0.0093, "step": 170080 }, { "epoch": 1.84, "learning_rate": 2.4184341960173832e-05, "loss": 0.008, "step": 170090 }, { "epoch": 1.84, "learning_rate": 2.4168126094570925e-05, "loss": 0.0059, "step": 170100 }, { "epoch": 1.84, "learning_rate": 2.415191022896802e-05, "loss": 0.0082, "step": 170110 }, { "epoch": 1.84, "learning_rate": 2.4135694363365114e-05, "loss": 0.0055, "step": 170120 }, { "epoch": 1.84, "learning_rate": 2.411947849776221e-05, "loss": 0.0051, "step": 170130 }, { "epoch": 1.84, "learning_rate": 2.4103262632159302e-05, "loss": 0.0059, "step": 170140 }, { "epoch": 1.84, "learning_rate": 2.4087046766556395e-05, "loss": 0.0068, "step": 170150 }, { "epoch": 1.84, "learning_rate": 2.407083090095349e-05, "loss": 0.0083, "step": 170160 }, { "epoch": 1.84, "learning_rate": 2.4054615035350584e-05, "loss": 0.0062, "step": 170170 }, { "epoch": 1.84, "learning_rate": 2.4038399169747677e-05, "loss": 0.0079, "step": 170180 }, { "epoch": 1.84, "learning_rate": 2.4022183304144773e-05, "loss": 0.0067, "step": 170190 }, { "epoch": 1.84, "learning_rate": 2.4005967438541866e-05, "loss": 0.0059, "step": 170200 }, { "epoch": 1.84, "learning_rate": 2.3989751572938962e-05, "loss": 0.007, "step": 170210 }, { "epoch": 1.84, "learning_rate": 2.3973535707336055e-05, "loss": 0.006, "step": 170220 }, { "epoch": 1.84, "learning_rate": 2.3957319841733147e-05, "loss": 0.0076, "step": 170230 }, { "epoch": 1.84, "learning_rate": 2.3941103976130243e-05, "loss": 0.0062, "step": 170240 }, { "epoch": 1.84, "learning_rate": 2.3924888110527336e-05, "loss": 0.0055, "step": 170250 }, { "epoch": 1.84, "learning_rate": 2.390867224492443e-05, "loss": 0.008, "step": 170260 }, { "epoch": 1.84, "learning_rate": 2.3892456379321525e-05, "loss": 0.0055, "step": 170270 }, { "epoch": 1.84, "learning_rate": 2.3876240513718618e-05, "loss": 0.0071, "step": 170280 }, { "epoch": 1.84, "learning_rate": 2.3860024648115714e-05, "loss": 0.0045, "step": 170290 }, { "epoch": 1.84, "learning_rate": 2.384380878251281e-05, "loss": 0.0086, "step": 170300 }, { "epoch": 1.84, "learning_rate": 2.3827592916909903e-05, "loss": 0.0058, "step": 170310 }, { "epoch": 1.84, "learning_rate": 2.3811377051307e-05, "loss": 0.0053, "step": 170320 }, { "epoch": 1.84, "learning_rate": 2.379516118570409e-05, "loss": 0.0066, "step": 170330 }, { "epoch": 1.84, "learning_rate": 2.3778945320101188e-05, "loss": 0.0053, "step": 170340 }, { "epoch": 1.84, "learning_rate": 2.376272945449828e-05, "loss": 0.006, "step": 170350 }, { "epoch": 1.84, "learning_rate": 2.3746513588895373e-05, "loss": 0.0057, "step": 170360 }, { "epoch": 1.84, "learning_rate": 2.373029772329247e-05, "loss": 0.0072, "step": 170370 }, { "epoch": 1.84, "learning_rate": 2.3714081857689562e-05, "loss": 0.0076, "step": 170380 }, { "epoch": 1.84, "learning_rate": 2.3697865992086655e-05, "loss": 0.0055, "step": 170390 }, { "epoch": 1.84, "learning_rate": 2.368165012648375e-05, "loss": 0.0058, "step": 170400 }, { "epoch": 1.84, "learning_rate": 2.3665434260880844e-05, "loss": 0.0075, "step": 170410 }, { "epoch": 1.84, "learning_rate": 2.364921839527794e-05, "loss": 0.0066, "step": 170420 }, { "epoch": 1.84, "learning_rate": 2.3633002529675033e-05, "loss": 0.0069, "step": 170430 }, { "epoch": 1.84, "learning_rate": 2.3616786664072125e-05, "loss": 0.0073, "step": 170440 }, { "epoch": 1.84, "learning_rate": 2.360057079846922e-05, "loss": 0.0065, "step": 170450 }, { "epoch": 1.84, "learning_rate": 2.3584354932866314e-05, "loss": 0.0081, "step": 170460 }, { "epoch": 1.84, "learning_rate": 2.3568139067263407e-05, "loss": 0.0055, "step": 170470 }, { "epoch": 1.84, "learning_rate": 2.3551923201660503e-05, "loss": 0.0074, "step": 170480 }, { "epoch": 1.84, "learning_rate": 2.3535707336057596e-05, "loss": 0.0057, "step": 170490 }, { "epoch": 1.84, "learning_rate": 2.3519491470454692e-05, "loss": 0.0065, "step": 170500 }, { "epoch": 1.84, "learning_rate": 2.3503275604851785e-05, "loss": 0.0059, "step": 170510 }, { "epoch": 1.84, "learning_rate": 2.3487059739248877e-05, "loss": 0.0065, "step": 170520 }, { "epoch": 1.84, "learning_rate": 2.3470843873645974e-05, "loss": 0.0077, "step": 170530 }, { "epoch": 1.84, "learning_rate": 2.3454628008043066e-05, "loss": 0.0075, "step": 170540 }, { "epoch": 1.84, "learning_rate": 2.343841214244016e-05, "loss": 0.0084, "step": 170550 }, { "epoch": 1.84, "learning_rate": 2.3422196276837255e-05, "loss": 0.0072, "step": 170560 }, { "epoch": 1.84, "learning_rate": 2.3405980411234348e-05, "loss": 0.0063, "step": 170570 }, { "epoch": 1.84, "learning_rate": 2.3389764545631444e-05, "loss": 0.0082, "step": 170580 }, { "epoch": 1.84, "learning_rate": 2.3373548680028537e-05, "loss": 0.0056, "step": 170590 }, { "epoch": 1.84, "learning_rate": 2.335733281442563e-05, "loss": 0.0117, "step": 170600 }, { "epoch": 1.84, "learning_rate": 2.3341116948822726e-05, "loss": 0.0089, "step": 170610 }, { "epoch": 1.84, "learning_rate": 2.332490108321982e-05, "loss": 0.0063, "step": 170620 }, { "epoch": 1.84, "learning_rate": 2.330868521761691e-05, "loss": 0.0053, "step": 170630 }, { "epoch": 1.84, "learning_rate": 2.3292469352014007e-05, "loss": 0.0043, "step": 170640 }, { "epoch": 1.84, "learning_rate": 2.32762534864111e-05, "loss": 0.0047, "step": 170650 }, { "epoch": 1.84, "learning_rate": 2.32600376208082e-05, "loss": 0.0076, "step": 170660 }, { "epoch": 1.85, "learning_rate": 2.3243821755205292e-05, "loss": 0.0073, "step": 170670 }, { "epoch": 1.85, "learning_rate": 2.3227605889602385e-05, "loss": 0.0064, "step": 170680 }, { "epoch": 1.85, "learning_rate": 2.321139002399948e-05, "loss": 0.0053, "step": 170690 }, { "epoch": 1.85, "learning_rate": 2.3195174158396574e-05, "loss": 0.0058, "step": 170700 }, { "epoch": 1.85, "learning_rate": 2.317895829279367e-05, "loss": 0.008, "step": 170710 }, { "epoch": 1.85, "learning_rate": 2.3162742427190763e-05, "loss": 0.0081, "step": 170720 }, { "epoch": 1.85, "learning_rate": 2.3146526561587856e-05, "loss": 0.0052, "step": 170730 }, { "epoch": 1.85, "learning_rate": 2.3130310695984952e-05, "loss": 0.0074, "step": 170740 }, { "epoch": 1.85, "learning_rate": 2.3114094830382044e-05, "loss": 0.0053, "step": 170750 }, { "epoch": 1.85, "learning_rate": 2.3097878964779137e-05, "loss": 0.0063, "step": 170760 }, { "epoch": 1.85, "learning_rate": 2.3081663099176233e-05, "loss": 0.0076, "step": 170770 }, { "epoch": 1.85, "learning_rate": 2.3065447233573326e-05, "loss": 0.0068, "step": 170780 }, { "epoch": 1.85, "learning_rate": 2.3049231367970422e-05, "loss": 0.0056, "step": 170790 }, { "epoch": 1.85, "learning_rate": 2.3033015502367515e-05, "loss": 0.0072, "step": 170800 }, { "epoch": 1.85, "learning_rate": 2.3016799636764608e-05, "loss": 0.0079, "step": 170810 }, { "epoch": 1.85, "learning_rate": 2.3000583771161704e-05, "loss": 0.0071, "step": 170820 }, { "epoch": 1.85, "learning_rate": 2.2984367905558797e-05, "loss": 0.0057, "step": 170830 }, { "epoch": 1.85, "learning_rate": 2.296815203995589e-05, "loss": 0.0062, "step": 170840 }, { "epoch": 1.85, "learning_rate": 2.2951936174352985e-05, "loss": 0.0074, "step": 170850 }, { "epoch": 1.85, "learning_rate": 2.2935720308750078e-05, "loss": 0.0048, "step": 170860 }, { "epoch": 1.85, "learning_rate": 2.2919504443147174e-05, "loss": 0.0066, "step": 170870 }, { "epoch": 1.85, "learning_rate": 2.2903288577544267e-05, "loss": 0.0067, "step": 170880 }, { "epoch": 1.85, "learning_rate": 2.288707271194136e-05, "loss": 0.0057, "step": 170890 }, { "epoch": 1.85, "learning_rate": 2.2870856846338456e-05, "loss": 0.0056, "step": 170900 }, { "epoch": 1.85, "learning_rate": 2.285464098073555e-05, "loss": 0.0052, "step": 170910 }, { "epoch": 1.85, "learning_rate": 2.283842511513264e-05, "loss": 0.0043, "step": 170920 }, { "epoch": 1.85, "learning_rate": 2.2822209249529738e-05, "loss": 0.0063, "step": 170930 }, { "epoch": 1.85, "learning_rate": 2.280599338392683e-05, "loss": 0.0054, "step": 170940 }, { "epoch": 1.85, "learning_rate": 2.2789777518323926e-05, "loss": 0.006, "step": 170950 }, { "epoch": 1.85, "learning_rate": 2.277356165272102e-05, "loss": 0.0049, "step": 170960 }, { "epoch": 1.85, "learning_rate": 2.2757345787118112e-05, "loss": 0.0062, "step": 170970 }, { "epoch": 1.85, "learning_rate": 2.2741129921515208e-05, "loss": 0.0053, "step": 170980 }, { "epoch": 1.85, "learning_rate": 2.27249140559123e-05, "loss": 0.0051, "step": 170990 }, { "epoch": 1.85, "learning_rate": 2.2708698190309394e-05, "loss": 0.0081, "step": 171000 }, { "epoch": 1.85, "eval_cer": 0.9215208542883797, "eval_loss": 0.005525045562535524, "eval_runtime": 121.1759, "eval_samples_per_second": 16.505, "eval_steps_per_second": 4.126, "step": 171000 }, { "epoch": 1.85, "learning_rate": 2.269248232470649e-05, "loss": 0.008, "step": 171010 }, { "epoch": 1.85, "learning_rate": 2.2676266459103586e-05, "loss": 0.0065, "step": 171020 }, { "epoch": 1.85, "learning_rate": 2.2660050593500682e-05, "loss": 0.0076, "step": 171030 }, { "epoch": 1.85, "learning_rate": 2.2643834727897775e-05, "loss": 0.0069, "step": 171040 }, { "epoch": 1.85, "learning_rate": 2.2627618862294867e-05, "loss": 0.0069, "step": 171050 }, { "epoch": 1.85, "learning_rate": 2.2611402996691964e-05, "loss": 0.0076, "step": 171060 }, { "epoch": 1.85, "learning_rate": 2.2595187131089056e-05, "loss": 0.0068, "step": 171070 }, { "epoch": 1.85, "learning_rate": 2.2578971265486152e-05, "loss": 0.0056, "step": 171080 }, { "epoch": 1.85, "learning_rate": 2.2562755399883245e-05, "loss": 0.0087, "step": 171090 }, { "epoch": 1.85, "learning_rate": 2.2546539534280338e-05, "loss": 0.0076, "step": 171100 }, { "epoch": 1.85, "learning_rate": 2.2530323668677434e-05, "loss": 0.0079, "step": 171110 }, { "epoch": 1.85, "learning_rate": 2.2514107803074527e-05, "loss": 0.0069, "step": 171120 }, { "epoch": 1.85, "learning_rate": 2.249789193747162e-05, "loss": 0.0057, "step": 171130 }, { "epoch": 1.85, "learning_rate": 2.2481676071868716e-05, "loss": 0.0055, "step": 171140 }, { "epoch": 1.85, "learning_rate": 2.246546020626581e-05, "loss": 0.0044, "step": 171150 }, { "epoch": 1.85, "learning_rate": 2.2449244340662905e-05, "loss": 0.0059, "step": 171160 }, { "epoch": 1.85, "learning_rate": 2.2433028475059997e-05, "loss": 0.0056, "step": 171170 }, { "epoch": 1.85, "learning_rate": 2.241681260945709e-05, "loss": 0.0057, "step": 171180 }, { "epoch": 1.85, "learning_rate": 2.2400596743854186e-05, "loss": 0.0064, "step": 171190 }, { "epoch": 1.85, "learning_rate": 2.238438087825128e-05, "loss": 0.0075, "step": 171200 }, { "epoch": 1.85, "learning_rate": 2.236816501264837e-05, "loss": 0.0065, "step": 171210 }, { "epoch": 1.85, "learning_rate": 2.2351949147045468e-05, "loss": 0.0053, "step": 171220 }, { "epoch": 1.85, "learning_rate": 2.233573328144256e-05, "loss": 0.0064, "step": 171230 }, { "epoch": 1.85, "learning_rate": 2.2319517415839657e-05, "loss": 0.0083, "step": 171240 }, { "epoch": 1.85, "learning_rate": 2.230330155023675e-05, "loss": 0.0069, "step": 171250 }, { "epoch": 1.85, "learning_rate": 2.2287085684633842e-05, "loss": 0.008, "step": 171260 }, { "epoch": 1.85, "learning_rate": 2.2270869819030938e-05, "loss": 0.006, "step": 171270 }, { "epoch": 1.85, "learning_rate": 2.225465395342803e-05, "loss": 0.0054, "step": 171280 }, { "epoch": 1.85, "learning_rate": 2.2238438087825124e-05, "loss": 0.0062, "step": 171290 }, { "epoch": 1.85, "learning_rate": 2.222222222222222e-05, "loss": 0.0077, "step": 171300 }, { "epoch": 1.85, "learning_rate": 2.2206006356619313e-05, "loss": 0.0071, "step": 171310 }, { "epoch": 1.85, "learning_rate": 2.2189790491016405e-05, "loss": 0.0058, "step": 171320 }, { "epoch": 1.85, "learning_rate": 2.21735746254135e-05, "loss": 0.0059, "step": 171330 }, { "epoch": 1.85, "learning_rate": 2.2157358759810594e-05, "loss": 0.0053, "step": 171340 }, { "epoch": 1.85, "learning_rate": 2.214114289420769e-05, "loss": 0.0077, "step": 171350 }, { "epoch": 1.85, "learning_rate": 2.2124927028604783e-05, "loss": 0.0074, "step": 171360 }, { "epoch": 1.85, "learning_rate": 2.2108711163001876e-05, "loss": 0.0056, "step": 171370 }, { "epoch": 1.85, "learning_rate": 2.2092495297398975e-05, "loss": 0.0049, "step": 171380 }, { "epoch": 1.85, "learning_rate": 2.2076279431796068e-05, "loss": 0.0073, "step": 171390 }, { "epoch": 1.85, "learning_rate": 2.2060063566193164e-05, "loss": 0.0092, "step": 171400 }, { "epoch": 1.85, "learning_rate": 2.2043847700590257e-05, "loss": 0.0058, "step": 171410 }, { "epoch": 1.85, "learning_rate": 2.202763183498735e-05, "loss": 0.0078, "step": 171420 }, { "epoch": 1.85, "learning_rate": 2.2011415969384446e-05, "loss": 0.0071, "step": 171430 }, { "epoch": 1.85, "learning_rate": 2.199520010378154e-05, "loss": 0.0067, "step": 171440 }, { "epoch": 1.85, "learning_rate": 2.1978984238178635e-05, "loss": 0.0077, "step": 171450 }, { "epoch": 1.85, "learning_rate": 2.1962768372575728e-05, "loss": 0.007, "step": 171460 }, { "epoch": 1.85, "learning_rate": 2.194655250697282e-05, "loss": 0.0063, "step": 171470 }, { "epoch": 1.85, "learning_rate": 2.1930336641369916e-05, "loss": 0.0058, "step": 171480 }, { "epoch": 1.85, "learning_rate": 2.191412077576701e-05, "loss": 0.006, "step": 171490 }, { "epoch": 1.85, "learning_rate": 2.1897904910164102e-05, "loss": 0.0049, "step": 171500 }, { "epoch": 1.85, "learning_rate": 2.1881689044561198e-05, "loss": 0.0075, "step": 171510 }, { "epoch": 1.85, "learning_rate": 2.186547317895829e-05, "loss": 0.0078, "step": 171520 }, { "epoch": 1.85, "learning_rate": 2.1849257313355387e-05, "loss": 0.0061, "step": 171530 }, { "epoch": 1.85, "learning_rate": 2.183304144775248e-05, "loss": 0.0068, "step": 171540 }, { "epoch": 1.85, "learning_rate": 2.1816825582149572e-05, "loss": 0.0062, "step": 171550 }, { "epoch": 1.85, "learning_rate": 2.180060971654667e-05, "loss": 0.0081, "step": 171560 }, { "epoch": 1.85, "learning_rate": 2.178439385094376e-05, "loss": 0.0031, "step": 171570 }, { "epoch": 1.85, "learning_rate": 2.1768177985340854e-05, "loss": 0.0063, "step": 171580 }, { "epoch": 1.85, "learning_rate": 2.175196211973795e-05, "loss": 0.0072, "step": 171590 }, { "epoch": 1.86, "learning_rate": 2.1735746254135043e-05, "loss": 0.005, "step": 171600 }, { "epoch": 1.86, "learning_rate": 2.1719530388532136e-05, "loss": 0.0066, "step": 171610 }, { "epoch": 1.86, "learning_rate": 2.1703314522929232e-05, "loss": 0.0062, "step": 171620 }, { "epoch": 1.86, "learning_rate": 2.1687098657326324e-05, "loss": 0.0062, "step": 171630 }, { "epoch": 1.86, "learning_rate": 2.167088279172342e-05, "loss": 0.006, "step": 171640 }, { "epoch": 1.86, "learning_rate": 2.1654666926120513e-05, "loss": 0.0076, "step": 171650 }, { "epoch": 1.86, "learning_rate": 2.1638451060517606e-05, "loss": 0.0069, "step": 171660 }, { "epoch": 1.86, "learning_rate": 2.1622235194914702e-05, "loss": 0.0061, "step": 171670 }, { "epoch": 1.86, "learning_rate": 2.1606019329311795e-05, "loss": 0.0052, "step": 171680 }, { "epoch": 1.86, "learning_rate": 2.1589803463708888e-05, "loss": 0.0057, "step": 171690 }, { "epoch": 1.86, "learning_rate": 2.1573587598105984e-05, "loss": 0.0069, "step": 171700 }, { "epoch": 1.86, "learning_rate": 2.1557371732503077e-05, "loss": 0.0067, "step": 171710 }, { "epoch": 1.86, "learning_rate": 2.1541155866900173e-05, "loss": 0.0065, "step": 171720 }, { "epoch": 1.86, "learning_rate": 2.1524940001297265e-05, "loss": 0.007, "step": 171730 }, { "epoch": 1.86, "learning_rate": 2.1508724135694365e-05, "loss": 0.006, "step": 171740 }, { "epoch": 1.86, "learning_rate": 2.1492508270091458e-05, "loss": 0.0066, "step": 171750 }, { "epoch": 1.86, "learning_rate": 2.147629240448855e-05, "loss": 0.007, "step": 171760 }, { "epoch": 1.86, "learning_rate": 2.1460076538885647e-05, "loss": 0.0078, "step": 171770 }, { "epoch": 1.86, "learning_rate": 2.144386067328274e-05, "loss": 0.0047, "step": 171780 }, { "epoch": 1.86, "learning_rate": 2.1427644807679832e-05, "loss": 0.0054, "step": 171790 }, { "epoch": 1.86, "learning_rate": 2.1411428942076928e-05, "loss": 0.0057, "step": 171800 }, { "epoch": 1.86, "learning_rate": 2.139521307647402e-05, "loss": 0.0071, "step": 171810 }, { "epoch": 1.86, "learning_rate": 2.1378997210871117e-05, "loss": 0.0091, "step": 171820 }, { "epoch": 1.86, "learning_rate": 2.136278134526821e-05, "loss": 0.0067, "step": 171830 }, { "epoch": 1.86, "learning_rate": 2.1346565479665303e-05, "loss": 0.0058, "step": 171840 }, { "epoch": 1.86, "learning_rate": 2.13303496140624e-05, "loss": 0.0065, "step": 171850 }, { "epoch": 1.86, "learning_rate": 2.131413374845949e-05, "loss": 0.0047, "step": 171860 }, { "epoch": 1.86, "learning_rate": 2.1297917882856584e-05, "loss": 0.0064, "step": 171870 }, { "epoch": 1.86, "learning_rate": 2.128170201725368e-05, "loss": 0.0071, "step": 171880 }, { "epoch": 1.86, "learning_rate": 2.1265486151650773e-05, "loss": 0.0054, "step": 171890 }, { "epoch": 1.86, "learning_rate": 2.124927028604787e-05, "loss": 0.0077, "step": 171900 }, { "epoch": 1.86, "learning_rate": 2.1233054420444962e-05, "loss": 0.0075, "step": 171910 }, { "epoch": 1.86, "learning_rate": 2.1216838554842055e-05, "loss": 0.0057, "step": 171920 }, { "epoch": 1.86, "learning_rate": 2.120062268923915e-05, "loss": 0.009, "step": 171930 }, { "epoch": 1.86, "learning_rate": 2.1184406823636244e-05, "loss": 0.0066, "step": 171940 }, { "epoch": 1.86, "learning_rate": 2.1168190958033336e-05, "loss": 0.0066, "step": 171950 }, { "epoch": 1.86, "learning_rate": 2.1151975092430432e-05, "loss": 0.0084, "step": 171960 }, { "epoch": 1.86, "learning_rate": 2.1135759226827525e-05, "loss": 0.0036, "step": 171970 }, { "epoch": 1.86, "learning_rate": 2.1119543361224618e-05, "loss": 0.0056, "step": 171980 }, { "epoch": 1.86, "learning_rate": 2.1103327495621714e-05, "loss": 0.0076, "step": 171990 }, { "epoch": 1.86, "learning_rate": 2.1087111630018807e-05, "loss": 0.0071, "step": 172000 }, { "epoch": 1.86, "eval_cer": 0.9215199856854233, "eval_loss": 0.005438223015516996, "eval_runtime": 121.1016, "eval_samples_per_second": 16.515, "eval_steps_per_second": 4.129, "step": 172000 }, { "epoch": 1.86, "learning_rate": 2.1070895764415903e-05, "loss": 0.0054, "step": 172010 }, { "epoch": 1.86, "learning_rate": 2.1054679898812996e-05, "loss": 0.0061, "step": 172020 }, { "epoch": 1.86, "learning_rate": 2.103846403321009e-05, "loss": 0.006, "step": 172030 }, { "epoch": 1.86, "learning_rate": 2.1022248167607185e-05, "loss": 0.0077, "step": 172040 }, { "epoch": 1.86, "learning_rate": 2.1006032302004277e-05, "loss": 0.0067, "step": 172050 }, { "epoch": 1.86, "learning_rate": 2.098981643640137e-05, "loss": 0.0065, "step": 172060 }, { "epoch": 1.86, "learning_rate": 2.0973600570798466e-05, "loss": 0.0071, "step": 172070 }, { "epoch": 1.86, "learning_rate": 2.095738470519556e-05, "loss": 0.0074, "step": 172080 }, { "epoch": 1.86, "learning_rate": 2.0941168839592655e-05, "loss": 0.0087, "step": 172090 }, { "epoch": 1.86, "learning_rate": 2.092495297398975e-05, "loss": 0.0058, "step": 172100 }, { "epoch": 1.86, "learning_rate": 2.0908737108386847e-05, "loss": 0.0055, "step": 172110 }, { "epoch": 1.86, "learning_rate": 2.089252124278394e-05, "loss": 0.0058, "step": 172120 }, { "epoch": 1.86, "learning_rate": 2.0876305377181033e-05, "loss": 0.007, "step": 172130 }, { "epoch": 1.86, "learning_rate": 2.086008951157813e-05, "loss": 0.0059, "step": 172140 }, { "epoch": 1.86, "learning_rate": 2.084387364597522e-05, "loss": 0.007, "step": 172150 }, { "epoch": 1.86, "learning_rate": 2.0827657780372314e-05, "loss": 0.0041, "step": 172160 }, { "epoch": 1.86, "learning_rate": 2.081144191476941e-05, "loss": 0.0062, "step": 172170 }, { "epoch": 1.86, "learning_rate": 2.0795226049166503e-05, "loss": 0.0058, "step": 172180 }, { "epoch": 1.86, "learning_rate": 2.07790101835636e-05, "loss": 0.0056, "step": 172190 }, { "epoch": 1.86, "learning_rate": 2.0762794317960692e-05, "loss": 0.0054, "step": 172200 }, { "epoch": 1.86, "learning_rate": 2.0746578452357785e-05, "loss": 0.0071, "step": 172210 }, { "epoch": 1.86, "learning_rate": 2.073036258675488e-05, "loss": 0.0077, "step": 172220 }, { "epoch": 1.86, "learning_rate": 2.0714146721151974e-05, "loss": 0.0056, "step": 172230 }, { "epoch": 1.86, "learning_rate": 2.0697930855549067e-05, "loss": 0.0052, "step": 172240 }, { "epoch": 1.86, "learning_rate": 2.0681714989946163e-05, "loss": 0.0054, "step": 172250 }, { "epoch": 1.86, "learning_rate": 2.0665499124343255e-05, "loss": 0.0069, "step": 172260 }, { "epoch": 1.86, "learning_rate": 2.0649283258740348e-05, "loss": 0.006, "step": 172270 }, { "epoch": 1.86, "learning_rate": 2.0633067393137444e-05, "loss": 0.0057, "step": 172280 }, { "epoch": 1.86, "learning_rate": 2.0616851527534537e-05, "loss": 0.0062, "step": 172290 }, { "epoch": 1.86, "learning_rate": 2.0600635661931633e-05, "loss": 0.0091, "step": 172300 }, { "epoch": 1.86, "learning_rate": 2.0584419796328726e-05, "loss": 0.0071, "step": 172310 }, { "epoch": 1.86, "learning_rate": 2.056820393072582e-05, "loss": 0.008, "step": 172320 }, { "epoch": 1.86, "learning_rate": 2.0551988065122915e-05, "loss": 0.0119, "step": 172330 }, { "epoch": 1.86, "learning_rate": 2.0535772199520008e-05, "loss": 0.0075, "step": 172340 }, { "epoch": 1.86, "learning_rate": 2.05195563339171e-05, "loss": 0.0069, "step": 172350 }, { "epoch": 1.86, "learning_rate": 2.0503340468314196e-05, "loss": 0.0067, "step": 172360 }, { "epoch": 1.86, "learning_rate": 2.048712460271129e-05, "loss": 0.0064, "step": 172370 }, { "epoch": 1.86, "learning_rate": 2.0470908737108385e-05, "loss": 0.0066, "step": 172380 }, { "epoch": 1.86, "learning_rate": 2.0454692871505478e-05, "loss": 0.0068, "step": 172390 }, { "epoch": 1.86, "learning_rate": 2.043847700590257e-05, "loss": 0.0074, "step": 172400 }, { "epoch": 1.86, "learning_rate": 2.0422261140299667e-05, "loss": 0.0058, "step": 172410 }, { "epoch": 1.86, "learning_rate": 2.040604527469676e-05, "loss": 0.0063, "step": 172420 }, { "epoch": 1.86, "learning_rate": 2.0389829409093852e-05, "loss": 0.0073, "step": 172430 }, { "epoch": 1.86, "learning_rate": 2.037361354349095e-05, "loss": 0.007, "step": 172440 }, { "epoch": 1.86, "learning_rate": 2.035739767788804e-05, "loss": 0.0056, "step": 172450 }, { "epoch": 1.86, "learning_rate": 2.034118181228514e-05, "loss": 0.0066, "step": 172460 }, { "epoch": 1.86, "learning_rate": 2.0324965946682234e-05, "loss": 0.0067, "step": 172470 }, { "epoch": 1.86, "learning_rate": 2.030875008107933e-05, "loss": 0.0087, "step": 172480 }, { "epoch": 1.86, "learning_rate": 2.0292534215476422e-05, "loss": 0.0074, "step": 172490 }, { "epoch": 1.86, "learning_rate": 2.0276318349873515e-05, "loss": 0.0045, "step": 172500 }, { "epoch": 1.86, "learning_rate": 2.026010248427061e-05, "loss": 0.0052, "step": 172510 }, { "epoch": 1.87, "learning_rate": 2.0243886618667704e-05, "loss": 0.0047, "step": 172520 }, { "epoch": 1.87, "learning_rate": 2.0227670753064797e-05, "loss": 0.0054, "step": 172530 }, { "epoch": 1.87, "learning_rate": 2.0211454887461893e-05, "loss": 0.0075, "step": 172540 }, { "epoch": 1.87, "learning_rate": 2.0195239021858986e-05, "loss": 0.0053, "step": 172550 }, { "epoch": 1.87, "learning_rate": 2.017902315625608e-05, "loss": 0.0049, "step": 172560 }, { "epoch": 1.87, "learning_rate": 2.0162807290653174e-05, "loss": 0.0074, "step": 172570 }, { "epoch": 1.87, "learning_rate": 2.0146591425050267e-05, "loss": 0.0066, "step": 172580 }, { "epoch": 1.87, "learning_rate": 2.0130375559447363e-05, "loss": 0.0057, "step": 172590 }, { "epoch": 1.87, "learning_rate": 2.0114159693844456e-05, "loss": 0.005, "step": 172600 }, { "epoch": 1.87, "learning_rate": 2.009794382824155e-05, "loss": 0.007, "step": 172610 }, { "epoch": 1.87, "learning_rate": 2.0081727962638645e-05, "loss": 0.0069, "step": 172620 }, { "epoch": 1.87, "learning_rate": 2.0065512097035738e-05, "loss": 0.0071, "step": 172630 }, { "epoch": 1.87, "learning_rate": 2.004929623143283e-05, "loss": 0.0065, "step": 172640 }, { "epoch": 1.87, "learning_rate": 2.0033080365829927e-05, "loss": 0.0073, "step": 172650 }, { "epoch": 1.87, "learning_rate": 2.001686450022702e-05, "loss": 0.0053, "step": 172660 }, { "epoch": 1.87, "learning_rate": 2.0000648634624115e-05, "loss": 0.0068, "step": 172670 }, { "epoch": 1.87, "learning_rate": 1.9984432769021208e-05, "loss": 0.0059, "step": 172680 }, { "epoch": 1.87, "learning_rate": 1.99682169034183e-05, "loss": 0.0067, "step": 172690 }, { "epoch": 1.87, "learning_rate": 1.9952001037815397e-05, "loss": 0.007, "step": 172700 }, { "epoch": 1.87, "learning_rate": 1.993578517221249e-05, "loss": 0.0112, "step": 172710 }, { "epoch": 1.87, "learning_rate": 1.9919569306609583e-05, "loss": 0.0088, "step": 172720 }, { "epoch": 1.87, "learning_rate": 1.990335344100668e-05, "loss": 0.0061, "step": 172730 }, { "epoch": 1.87, "learning_rate": 1.988713757540377e-05, "loss": 0.0053, "step": 172740 }, { "epoch": 1.87, "learning_rate": 1.9870921709800868e-05, "loss": 0.0054, "step": 172750 }, { "epoch": 1.87, "learning_rate": 1.985470584419796e-05, "loss": 0.005, "step": 172760 }, { "epoch": 1.87, "learning_rate": 1.9838489978595053e-05, "loss": 0.0057, "step": 172770 }, { "epoch": 1.87, "learning_rate": 1.982227411299215e-05, "loss": 0.0077, "step": 172780 }, { "epoch": 1.87, "learning_rate": 1.9806058247389242e-05, "loss": 0.0072, "step": 172790 }, { "epoch": 1.87, "learning_rate": 1.9789842381786335e-05, "loss": 0.007, "step": 172800 }, { "epoch": 1.87, "learning_rate": 1.977362651618343e-05, "loss": 0.0085, "step": 172810 }, { "epoch": 1.87, "learning_rate": 1.9757410650580527e-05, "loss": 0.0057, "step": 172820 }, { "epoch": 1.87, "learning_rate": 1.9741194784977623e-05, "loss": 0.0046, "step": 172830 }, { "epoch": 1.87, "learning_rate": 1.9724978919374716e-05, "loss": 0.0061, "step": 172840 }, { "epoch": 1.87, "learning_rate": 1.970876305377181e-05, "loss": 0.0061, "step": 172850 }, { "epoch": 1.87, "learning_rate": 1.9692547188168905e-05, "loss": 0.0077, "step": 172860 }, { "epoch": 1.87, "learning_rate": 1.9676331322565997e-05, "loss": 0.0069, "step": 172870 }, { "epoch": 1.87, "learning_rate": 1.9660115456963094e-05, "loss": 0.0078, "step": 172880 }, { "epoch": 1.87, "learning_rate": 1.9643899591360186e-05, "loss": 0.0069, "step": 172890 }, { "epoch": 1.87, "learning_rate": 1.962768372575728e-05, "loss": 0.0063, "step": 172900 }, { "epoch": 1.87, "learning_rate": 1.9611467860154375e-05, "loss": 0.007, "step": 172910 }, { "epoch": 1.87, "learning_rate": 1.9595251994551468e-05, "loss": 0.0071, "step": 172920 }, { "epoch": 1.87, "learning_rate": 1.957903612894856e-05, "loss": 0.0114, "step": 172930 }, { "epoch": 1.87, "learning_rate": 1.9562820263345657e-05, "loss": 0.0064, "step": 172940 }, { "epoch": 1.87, "learning_rate": 1.954660439774275e-05, "loss": 0.0048, "step": 172950 }, { "epoch": 1.87, "learning_rate": 1.9530388532139846e-05, "loss": 0.0073, "step": 172960 }, { "epoch": 1.87, "learning_rate": 1.951417266653694e-05, "loss": 0.0072, "step": 172970 }, { "epoch": 1.87, "learning_rate": 1.949795680093403e-05, "loss": 0.0063, "step": 172980 }, { "epoch": 1.87, "learning_rate": 1.9481740935331127e-05, "loss": 0.0059, "step": 172990 }, { "epoch": 1.87, "learning_rate": 1.946552506972822e-05, "loss": 0.0077, "step": 173000 }, { "epoch": 1.87, "eval_cer": 0.921521722891336, "eval_loss": 0.00535942055284977, "eval_runtime": 121.276, "eval_samples_per_second": 16.491, "eval_steps_per_second": 4.123, "step": 173000 }, { "epoch": 1.87, "learning_rate": 1.9449309204125313e-05, "loss": 0.006, "step": 173010 }, { "epoch": 1.87, "learning_rate": 1.943309333852241e-05, "loss": 0.005, "step": 173020 }, { "epoch": 1.87, "learning_rate": 1.94168774729195e-05, "loss": 0.0049, "step": 173030 }, { "epoch": 1.87, "learning_rate": 1.9400661607316598e-05, "loss": 0.0069, "step": 173040 }, { "epoch": 1.87, "learning_rate": 1.938444574171369e-05, "loss": 0.0047, "step": 173050 }, { "epoch": 1.87, "learning_rate": 1.9368229876110783e-05, "loss": 0.0048, "step": 173060 }, { "epoch": 1.87, "learning_rate": 1.935201401050788e-05, "loss": 0.0075, "step": 173070 }, { "epoch": 1.87, "learning_rate": 1.9335798144904972e-05, "loss": 0.0054, "step": 173080 }, { "epoch": 1.87, "learning_rate": 1.9319582279302065e-05, "loss": 0.0061, "step": 173090 }, { "epoch": 1.87, "learning_rate": 1.930336641369916e-05, "loss": 0.0072, "step": 173100 }, { "epoch": 1.87, "learning_rate": 1.9287150548096254e-05, "loss": 0.0072, "step": 173110 }, { "epoch": 1.87, "learning_rate": 1.927093468249335e-05, "loss": 0.0059, "step": 173120 }, { "epoch": 1.87, "learning_rate": 1.9254718816890443e-05, "loss": 0.0056, "step": 173130 }, { "epoch": 1.87, "learning_rate": 1.9238502951287535e-05, "loss": 0.0064, "step": 173140 }, { "epoch": 1.87, "learning_rate": 1.922228708568463e-05, "loss": 0.0064, "step": 173150 }, { "epoch": 1.87, "learning_rate": 1.9206071220081724e-05, "loss": 0.005, "step": 173160 }, { "epoch": 1.87, "learning_rate": 1.9189855354478817e-05, "loss": 0.0063, "step": 173170 }, { "epoch": 1.87, "learning_rate": 1.9173639488875917e-05, "loss": 0.005, "step": 173180 }, { "epoch": 1.87, "learning_rate": 1.915742362327301e-05, "loss": 0.0068, "step": 173190 }, { "epoch": 1.87, "learning_rate": 1.9141207757670105e-05, "loss": 0.0072, "step": 173200 }, { "epoch": 1.87, "learning_rate": 1.9124991892067198e-05, "loss": 0.0071, "step": 173210 }, { "epoch": 1.87, "learning_rate": 1.910877602646429e-05, "loss": 0.0063, "step": 173220 }, { "epoch": 1.87, "learning_rate": 1.9092560160861387e-05, "loss": 0.0064, "step": 173230 }, { "epoch": 1.87, "learning_rate": 1.907634429525848e-05, "loss": 0.0059, "step": 173240 }, { "epoch": 1.87, "learning_rate": 1.9060128429655576e-05, "loss": 0.005, "step": 173250 }, { "epoch": 1.87, "learning_rate": 1.904391256405267e-05, "loss": 0.0061, "step": 173260 }, { "epoch": 1.87, "learning_rate": 1.902769669844976e-05, "loss": 0.0052, "step": 173270 }, { "epoch": 1.87, "learning_rate": 1.9011480832846858e-05, "loss": 0.0057, "step": 173280 }, { "epoch": 1.87, "learning_rate": 1.899526496724395e-05, "loss": 0.0062, "step": 173290 }, { "epoch": 1.87, "learning_rate": 1.8979049101641043e-05, "loss": 0.0067, "step": 173300 }, { "epoch": 1.87, "learning_rate": 1.896283323603814e-05, "loss": 0.0053, "step": 173310 }, { "epoch": 1.87, "learning_rate": 1.8946617370435232e-05, "loss": 0.006, "step": 173320 }, { "epoch": 1.87, "learning_rate": 1.8930401504832328e-05, "loss": 0.0081, "step": 173330 }, { "epoch": 1.87, "learning_rate": 1.891418563922942e-05, "loss": 0.0063, "step": 173340 }, { "epoch": 1.87, "learning_rate": 1.8897969773626514e-05, "loss": 0.0069, "step": 173350 }, { "epoch": 1.87, "learning_rate": 1.888175390802361e-05, "loss": 0.0076, "step": 173360 }, { "epoch": 1.87, "learning_rate": 1.8865538042420702e-05, "loss": 0.0053, "step": 173370 }, { "epoch": 1.87, "learning_rate": 1.8849322176817795e-05, "loss": 0.0062, "step": 173380 }, { "epoch": 1.87, "learning_rate": 1.883310631121489e-05, "loss": 0.0058, "step": 173390 }, { "epoch": 1.87, "learning_rate": 1.8816890445611984e-05, "loss": 0.0059, "step": 173400 }, { "epoch": 1.87, "learning_rate": 1.880067458000908e-05, "loss": 0.0122, "step": 173410 }, { "epoch": 1.87, "learning_rate": 1.8784458714406173e-05, "loss": 0.0058, "step": 173420 }, { "epoch": 1.87, "learning_rate": 1.8768242848803266e-05, "loss": 0.0053, "step": 173430 }, { "epoch": 1.87, "learning_rate": 1.8752026983200362e-05, "loss": 0.0054, "step": 173440 }, { "epoch": 1.88, "learning_rate": 1.8735811117597458e-05, "loss": 0.009, "step": 173450 }, { "epoch": 1.88, "learning_rate": 1.871959525199455e-05, "loss": 0.0065, "step": 173460 }, { "epoch": 1.88, "learning_rate": 1.8703379386391643e-05, "loss": 0.0065, "step": 173470 }, { "epoch": 1.88, "learning_rate": 1.868716352078874e-05, "loss": 0.0081, "step": 173480 }, { "epoch": 1.88, "learning_rate": 1.8670947655185832e-05, "loss": 0.0079, "step": 173490 }, { "epoch": 1.88, "learning_rate": 1.8654731789582925e-05, "loss": 0.0054, "step": 173500 }, { "epoch": 1.88, "learning_rate": 1.863851592398002e-05, "loss": 0.0054, "step": 173510 }, { "epoch": 1.88, "learning_rate": 1.8622300058377114e-05, "loss": 0.0085, "step": 173520 }, { "epoch": 1.88, "learning_rate": 1.860608419277421e-05, "loss": 0.005, "step": 173530 }, { "epoch": 1.88, "learning_rate": 1.8589868327171303e-05, "loss": 0.0055, "step": 173540 }, { "epoch": 1.88, "learning_rate": 1.8573652461568395e-05, "loss": 0.0057, "step": 173550 }, { "epoch": 1.88, "learning_rate": 1.855743659596549e-05, "loss": 0.0058, "step": 173560 }, { "epoch": 1.88, "learning_rate": 1.8541220730362584e-05, "loss": 0.0066, "step": 173570 }, { "epoch": 1.88, "learning_rate": 1.8525004864759677e-05, "loss": 0.0071, "step": 173580 }, { "epoch": 1.88, "learning_rate": 1.8508788999156773e-05, "loss": 0.0065, "step": 173590 }, { "epoch": 1.88, "learning_rate": 1.8492573133553866e-05, "loss": 0.0048, "step": 173600 }, { "epoch": 1.88, "learning_rate": 1.8476357267950962e-05, "loss": 0.005, "step": 173610 }, { "epoch": 1.88, "learning_rate": 1.8460141402348055e-05, "loss": 0.0063, "step": 173620 }, { "epoch": 1.88, "learning_rate": 1.844392553674515e-05, "loss": 0.0054, "step": 173630 }, { "epoch": 1.88, "learning_rate": 1.8427709671142244e-05, "loss": 0.0077, "step": 173640 }, { "epoch": 1.88, "learning_rate": 1.841149380553934e-05, "loss": 0.0069, "step": 173650 }, { "epoch": 1.88, "learning_rate": 1.8395277939936433e-05, "loss": 0.0074, "step": 173660 }, { "epoch": 1.88, "learning_rate": 1.8379062074333525e-05, "loss": 0.0088, "step": 173670 }, { "epoch": 1.88, "learning_rate": 1.836284620873062e-05, "loss": 0.0054, "step": 173680 }, { "epoch": 1.88, "learning_rate": 1.8346630343127714e-05, "loss": 0.0072, "step": 173690 }, { "epoch": 1.88, "learning_rate": 1.833041447752481e-05, "loss": 0.0066, "step": 173700 }, { "epoch": 1.88, "learning_rate": 1.8314198611921903e-05, "loss": 0.0051, "step": 173710 }, { "epoch": 1.88, "learning_rate": 1.8297982746318996e-05, "loss": 0.0053, "step": 173720 }, { "epoch": 1.88, "learning_rate": 1.8281766880716092e-05, "loss": 0.0062, "step": 173730 }, { "epoch": 1.88, "learning_rate": 1.8265551015113185e-05, "loss": 0.0058, "step": 173740 }, { "epoch": 1.88, "learning_rate": 1.8249335149510277e-05, "loss": 0.0054, "step": 173750 }, { "epoch": 1.88, "learning_rate": 1.8233119283907374e-05, "loss": 0.0065, "step": 173760 }, { "epoch": 1.88, "learning_rate": 1.8216903418304466e-05, "loss": 0.0061, "step": 173770 }, { "epoch": 1.88, "learning_rate": 1.8200687552701562e-05, "loss": 0.0057, "step": 173780 }, { "epoch": 1.88, "learning_rate": 1.8184471687098655e-05, "loss": 0.0045, "step": 173790 }, { "epoch": 1.88, "learning_rate": 1.8168255821495748e-05, "loss": 0.0086, "step": 173800 }, { "epoch": 1.88, "learning_rate": 1.8152039955892844e-05, "loss": 0.0052, "step": 173810 }, { "epoch": 1.88, "learning_rate": 1.813582409028994e-05, "loss": 0.0081, "step": 173820 }, { "epoch": 1.88, "learning_rate": 1.8119608224687033e-05, "loss": 0.0066, "step": 173830 }, { "epoch": 1.88, "learning_rate": 1.8103392359084126e-05, "loss": 0.0047, "step": 173840 }, { "epoch": 1.88, "learning_rate": 1.8087176493481222e-05, "loss": 0.0055, "step": 173850 }, { "epoch": 1.88, "learning_rate": 1.8070960627878315e-05, "loss": 0.0072, "step": 173860 }, { "epoch": 1.88, "learning_rate": 1.8054744762275407e-05, "loss": 0.0056, "step": 173870 }, { "epoch": 1.88, "learning_rate": 1.8038528896672503e-05, "loss": 0.0056, "step": 173880 }, { "epoch": 1.88, "learning_rate": 1.8022313031069596e-05, "loss": 0.0082, "step": 173890 }, { "epoch": 1.88, "learning_rate": 1.8006097165466692e-05, "loss": 0.0076, "step": 173900 }, { "epoch": 1.88, "learning_rate": 1.7989881299863785e-05, "loss": 0.0071, "step": 173910 }, { "epoch": 1.88, "learning_rate": 1.7973665434260878e-05, "loss": 0.0061, "step": 173920 }, { "epoch": 1.88, "learning_rate": 1.7957449568657974e-05, "loss": 0.0053, "step": 173930 }, { "epoch": 1.88, "learning_rate": 1.7941233703055067e-05, "loss": 0.0049, "step": 173940 }, { "epoch": 1.88, "learning_rate": 1.792501783745216e-05, "loss": 0.0082, "step": 173950 }, { "epoch": 1.88, "learning_rate": 1.7908801971849256e-05, "loss": 0.0065, "step": 173960 }, { "epoch": 1.88, "learning_rate": 1.789258610624635e-05, "loss": 0.0073, "step": 173970 }, { "epoch": 1.88, "learning_rate": 1.7876370240643444e-05, "loss": 0.0055, "step": 173980 }, { "epoch": 1.88, "learning_rate": 1.786015437504054e-05, "loss": 0.0045, "step": 173990 }, { "epoch": 1.88, "learning_rate": 1.7843938509437633e-05, "loss": 0.0053, "step": 174000 }, { "epoch": 1.88, "eval_cer": 0.9215086938469904, "eval_loss": 0.005281680729240179, "eval_runtime": 121.3681, "eval_samples_per_second": 16.479, "eval_steps_per_second": 4.12, "step": 174000 }, { "epoch": 1.88, "learning_rate": 1.7827722643834726e-05, "loss": 0.0084, "step": 174010 }, { "epoch": 1.88, "learning_rate": 1.7811506778231822e-05, "loss": 0.0061, "step": 174020 }, { "epoch": 1.88, "learning_rate": 1.7795290912628915e-05, "loss": 0.0061, "step": 174030 }, { "epoch": 1.88, "learning_rate": 1.7779075047026008e-05, "loss": 0.0067, "step": 174040 }, { "epoch": 1.88, "learning_rate": 1.7762859181423104e-05, "loss": 0.0066, "step": 174050 }, { "epoch": 1.88, "learning_rate": 1.7746643315820197e-05, "loss": 0.0061, "step": 174060 }, { "epoch": 1.88, "learning_rate": 1.7730427450217293e-05, "loss": 0.0083, "step": 174070 }, { "epoch": 1.88, "learning_rate": 1.7714211584614385e-05, "loss": 0.0115, "step": 174080 }, { "epoch": 1.88, "learning_rate": 1.7697995719011478e-05, "loss": 0.0049, "step": 174090 }, { "epoch": 1.88, "learning_rate": 1.7681779853408574e-05, "loss": 0.0065, "step": 174100 }, { "epoch": 1.88, "learning_rate": 1.7665563987805667e-05, "loss": 0.0066, "step": 174110 }, { "epoch": 1.88, "learning_rate": 1.764934812220276e-05, "loss": 0.0063, "step": 174120 }, { "epoch": 1.88, "learning_rate": 1.7633132256599856e-05, "loss": 0.0058, "step": 174130 }, { "epoch": 1.88, "learning_rate": 1.761691639099695e-05, "loss": 0.006, "step": 174140 }, { "epoch": 1.88, "learning_rate": 1.760070052539404e-05, "loss": 0.0065, "step": 174150 }, { "epoch": 1.88, "learning_rate": 1.7584484659791138e-05, "loss": 0.0055, "step": 174160 }, { "epoch": 1.88, "learning_rate": 1.7568268794188234e-05, "loss": 0.0055, "step": 174170 }, { "epoch": 1.88, "learning_rate": 1.7552052928585326e-05, "loss": 0.0055, "step": 174180 }, { "epoch": 1.88, "learning_rate": 1.7535837062982423e-05, "loss": 0.0062, "step": 174190 }, { "epoch": 1.88, "learning_rate": 1.7519621197379515e-05, "loss": 0.0091, "step": 174200 }, { "epoch": 1.88, "learning_rate": 1.7503405331776608e-05, "loss": 0.006, "step": 174210 }, { "epoch": 1.88, "learning_rate": 1.7487189466173704e-05, "loss": 0.006, "step": 174220 }, { "epoch": 1.88, "learning_rate": 1.7470973600570797e-05, "loss": 0.0057, "step": 174230 }, { "epoch": 1.88, "learning_rate": 1.745475773496789e-05, "loss": 0.0071, "step": 174240 }, { "epoch": 1.88, "learning_rate": 1.7438541869364986e-05, "loss": 0.0072, "step": 174250 }, { "epoch": 1.88, "learning_rate": 1.742232600376208e-05, "loss": 0.006, "step": 174260 }, { "epoch": 1.88, "learning_rate": 1.7406110138159175e-05, "loss": 0.0072, "step": 174270 }, { "epoch": 1.88, "learning_rate": 1.7389894272556267e-05, "loss": 0.0044, "step": 174280 }, { "epoch": 1.88, "learning_rate": 1.737367840695336e-05, "loss": 0.0084, "step": 174290 }, { "epoch": 1.88, "learning_rate": 1.7357462541350456e-05, "loss": 0.0067, "step": 174300 }, { "epoch": 1.88, "learning_rate": 1.734124667574755e-05, "loss": 0.0085, "step": 174310 }, { "epoch": 1.88, "learning_rate": 1.7325030810144642e-05, "loss": 0.0057, "step": 174320 }, { "epoch": 1.88, "learning_rate": 1.7308814944541738e-05, "loss": 0.0059, "step": 174330 }, { "epoch": 1.88, "learning_rate": 1.729259907893883e-05, "loss": 0.0062, "step": 174340 }, { "epoch": 1.88, "learning_rate": 1.7276383213335927e-05, "loss": 0.0051, "step": 174350 }, { "epoch": 1.88, "learning_rate": 1.7260167347733023e-05, "loss": 0.0084, "step": 174360 }, { "epoch": 1.89, "learning_rate": 1.7243951482130116e-05, "loss": 0.0056, "step": 174370 }, { "epoch": 1.89, "learning_rate": 1.722773561652721e-05, "loss": 0.0055, "step": 174380 }, { "epoch": 1.89, "learning_rate": 1.7211519750924305e-05, "loss": 0.005, "step": 174390 }, { "epoch": 1.89, "learning_rate": 1.7195303885321397e-05, "loss": 0.0058, "step": 174400 }, { "epoch": 1.89, "learning_rate": 1.717908801971849e-05, "loss": 0.0078, "step": 174410 }, { "epoch": 1.89, "learning_rate": 1.7162872154115586e-05, "loss": 0.0071, "step": 174420 }, { "epoch": 1.89, "learning_rate": 1.714665628851268e-05, "loss": 0.0049, "step": 174430 }, { "epoch": 1.89, "learning_rate": 1.713044042290977e-05, "loss": 0.0064, "step": 174440 }, { "epoch": 1.89, "learning_rate": 1.7114224557306868e-05, "loss": 0.0055, "step": 174450 }, { "epoch": 1.89, "learning_rate": 1.709800869170396e-05, "loss": 0.0086, "step": 174460 }, { "epoch": 1.89, "learning_rate": 1.7081792826101057e-05, "loss": 0.005, "step": 174470 }, { "epoch": 1.89, "learning_rate": 1.706557696049815e-05, "loss": 0.006, "step": 174480 }, { "epoch": 1.89, "learning_rate": 1.7049361094895242e-05, "loss": 0.0063, "step": 174490 }, { "epoch": 1.89, "learning_rate": 1.7033145229292338e-05, "loss": 0.0062, "step": 174500 }, { "epoch": 1.89, "learning_rate": 1.701692936368943e-05, "loss": 0.0051, "step": 174510 }, { "epoch": 1.89, "learning_rate": 1.7000713498086524e-05, "loss": 0.0063, "step": 174520 }, { "epoch": 1.89, "learning_rate": 1.698449763248362e-05, "loss": 0.0058, "step": 174530 }, { "epoch": 1.89, "learning_rate": 1.6968281766880716e-05, "loss": 0.0086, "step": 174540 }, { "epoch": 1.89, "learning_rate": 1.695206590127781e-05, "loss": 0.0053, "step": 174550 }, { "epoch": 1.89, "learning_rate": 1.6935850035674905e-05, "loss": 0.0061, "step": 174560 }, { "epoch": 1.89, "learning_rate": 1.6919634170071998e-05, "loss": 0.0065, "step": 174570 }, { "epoch": 1.89, "learning_rate": 1.690341830446909e-05, "loss": 0.0065, "step": 174580 }, { "epoch": 1.89, "learning_rate": 1.6887202438866187e-05, "loss": 0.0077, "step": 174590 }, { "epoch": 1.89, "learning_rate": 1.687098657326328e-05, "loss": 0.0076, "step": 174600 }, { "epoch": 1.89, "learning_rate": 1.6854770707660372e-05, "loss": 0.004, "step": 174610 }, { "epoch": 1.89, "learning_rate": 1.6838554842057468e-05, "loss": 0.0061, "step": 174620 }, { "epoch": 1.89, "learning_rate": 1.682233897645456e-05, "loss": 0.0075, "step": 174630 }, { "epoch": 1.89, "learning_rate": 1.6806123110851657e-05, "loss": 0.0069, "step": 174640 }, { "epoch": 1.89, "learning_rate": 1.678990724524875e-05, "loss": 0.0075, "step": 174650 }, { "epoch": 1.89, "learning_rate": 1.6773691379645842e-05, "loss": 0.0064, "step": 174660 }, { "epoch": 1.89, "learning_rate": 1.675747551404294e-05, "loss": 0.007, "step": 174670 }, { "epoch": 1.89, "learning_rate": 1.674125964844003e-05, "loss": 0.0064, "step": 174680 }, { "epoch": 1.89, "learning_rate": 1.6725043782837124e-05, "loss": 0.0052, "step": 174690 }, { "epoch": 1.89, "learning_rate": 1.670882791723422e-05, "loss": 0.0075, "step": 174700 }, { "epoch": 1.89, "learning_rate": 1.6692612051631316e-05, "loss": 0.007, "step": 174710 }, { "epoch": 1.89, "learning_rate": 1.667639618602841e-05, "loss": 0.0054, "step": 174720 }, { "epoch": 1.89, "learning_rate": 1.6660180320425505e-05, "loss": 0.007, "step": 174730 }, { "epoch": 1.89, "learning_rate": 1.6643964454822598e-05, "loss": 0.006, "step": 174740 }, { "epoch": 1.89, "learning_rate": 1.662774858921969e-05, "loss": 0.0062, "step": 174750 }, { "epoch": 1.89, "learning_rate": 1.6611532723616787e-05, "loss": 0.0067, "step": 174760 }, { "epoch": 1.89, "learning_rate": 1.659531685801388e-05, "loss": 0.0054, "step": 174770 }, { "epoch": 1.89, "learning_rate": 1.6579100992410972e-05, "loss": 0.0053, "step": 174780 }, { "epoch": 1.89, "learning_rate": 1.656288512680807e-05, "loss": 0.0068, "step": 174790 }, { "epoch": 1.89, "learning_rate": 1.654666926120516e-05, "loss": 0.0068, "step": 174800 }, { "epoch": 1.89, "learning_rate": 1.6530453395602254e-05, "loss": 0.0038, "step": 174810 }, { "epoch": 1.89, "learning_rate": 1.651423752999935e-05, "loss": 0.0055, "step": 174820 }, { "epoch": 1.89, "learning_rate": 1.6498021664396443e-05, "loss": 0.0058, "step": 174830 }, { "epoch": 1.89, "learning_rate": 1.648180579879354e-05, "loss": 0.0066, "step": 174840 }, { "epoch": 1.89, "learning_rate": 1.6465589933190632e-05, "loss": 0.0083, "step": 174850 }, { "epoch": 1.89, "learning_rate": 1.6449374067587724e-05, "loss": 0.0058, "step": 174860 }, { "epoch": 1.89, "learning_rate": 1.643315820198482e-05, "loss": 0.0047, "step": 174870 }, { "epoch": 1.89, "learning_rate": 1.6416942336381917e-05, "loss": 0.004, "step": 174880 }, { "epoch": 1.89, "learning_rate": 1.640072647077901e-05, "loss": 0.0085, "step": 174890 }, { "epoch": 1.89, "learning_rate": 1.6384510605176102e-05, "loss": 0.0047, "step": 174900 }, { "epoch": 1.89, "learning_rate": 1.63682947395732e-05, "loss": 0.0077, "step": 174910 }, { "epoch": 1.89, "learning_rate": 1.635207887397029e-05, "loss": 0.0067, "step": 174920 }, { "epoch": 1.89, "learning_rate": 1.6335863008367387e-05, "loss": 0.0075, "step": 174930 }, { "epoch": 1.89, "learning_rate": 1.631964714276448e-05, "loss": 0.0064, "step": 174940 }, { "epoch": 1.89, "learning_rate": 1.6303431277161573e-05, "loss": 0.0062, "step": 174950 }, { "epoch": 1.89, "learning_rate": 1.628721541155867e-05, "loss": 0.0086, "step": 174960 }, { "epoch": 1.89, "learning_rate": 1.627099954595576e-05, "loss": 0.0055, "step": 174970 }, { "epoch": 1.89, "learning_rate": 1.6254783680352854e-05, "loss": 0.007, "step": 174980 }, { "epoch": 1.89, "learning_rate": 1.623856781474995e-05, "loss": 0.0067, "step": 174990 }, { "epoch": 1.89, "learning_rate": 1.6222351949147043e-05, "loss": 0.0067, "step": 175000 }, { "epoch": 1.89, "eval_cer": 0.9215121682588159, "eval_loss": 0.005301313009113073, "eval_runtime": 121.5762, "eval_samples_per_second": 16.451, "eval_steps_per_second": 4.113, "step": 175000 }, { "epoch": 1.89, "learning_rate": 1.620613608354414e-05, "loss": 0.0065, "step": 175010 }, { "epoch": 1.89, "learning_rate": 1.6189920217941232e-05, "loss": 0.0077, "step": 175020 }, { "epoch": 1.89, "learning_rate": 1.6173704352338325e-05, "loss": 0.005, "step": 175030 }, { "epoch": 1.89, "learning_rate": 1.615748848673542e-05, "loss": 0.0057, "step": 175040 }, { "epoch": 1.89, "learning_rate": 1.6141272621132514e-05, "loss": 0.0046, "step": 175050 }, { "epoch": 1.89, "learning_rate": 1.612505675552961e-05, "loss": 0.0061, "step": 175060 }, { "epoch": 1.89, "learning_rate": 1.6108840889926703e-05, "loss": 0.0059, "step": 175070 }, { "epoch": 1.89, "learning_rate": 1.60926250243238e-05, "loss": 0.0083, "step": 175080 }, { "epoch": 1.89, "learning_rate": 1.607640915872089e-05, "loss": 0.0074, "step": 175090 }, { "epoch": 1.89, "learning_rate": 1.6060193293117984e-05, "loss": 0.0063, "step": 175100 }, { "epoch": 1.89, "learning_rate": 1.604397742751508e-05, "loss": 0.0108, "step": 175110 }, { "epoch": 1.89, "learning_rate": 1.6027761561912173e-05, "loss": 0.0068, "step": 175120 }, { "epoch": 1.89, "learning_rate": 1.601154569630927e-05, "loss": 0.0072, "step": 175130 }, { "epoch": 1.89, "learning_rate": 1.5995329830706362e-05, "loss": 0.0056, "step": 175140 }, { "epoch": 1.89, "learning_rate": 1.5979113965103455e-05, "loss": 0.0067, "step": 175150 }, { "epoch": 1.89, "learning_rate": 1.596289809950055e-05, "loss": 0.0068, "step": 175160 }, { "epoch": 1.89, "learning_rate": 1.5946682233897644e-05, "loss": 0.0082, "step": 175170 }, { "epoch": 1.89, "learning_rate": 1.5930466368294736e-05, "loss": 0.0071, "step": 175180 }, { "epoch": 1.89, "learning_rate": 1.5914250502691832e-05, "loss": 0.0055, "step": 175190 }, { "epoch": 1.89, "learning_rate": 1.5898034637088925e-05, "loss": 0.0081, "step": 175200 }, { "epoch": 1.89, "learning_rate": 1.588181877148602e-05, "loss": 0.0079, "step": 175210 }, { "epoch": 1.89, "learning_rate": 1.5865602905883114e-05, "loss": 0.0079, "step": 175220 }, { "epoch": 1.89, "learning_rate": 1.5849387040280207e-05, "loss": 0.0073, "step": 175230 }, { "epoch": 1.89, "learning_rate": 1.5833171174677303e-05, "loss": 0.0059, "step": 175240 }, { "epoch": 1.89, "learning_rate": 1.58169553090744e-05, "loss": 0.0067, "step": 175250 }, { "epoch": 1.89, "learning_rate": 1.5800739443471492e-05, "loss": 0.0075, "step": 175260 }, { "epoch": 1.89, "learning_rate": 1.5784523577868585e-05, "loss": 0.006, "step": 175270 }, { "epoch": 1.89, "learning_rate": 1.576830771226568e-05, "loss": 0.008, "step": 175280 }, { "epoch": 1.89, "learning_rate": 1.5752091846662773e-05, "loss": 0.009, "step": 175290 }, { "epoch": 1.9, "learning_rate": 1.573587598105987e-05, "loss": 0.0051, "step": 175300 }, { "epoch": 1.9, "learning_rate": 1.5719660115456962e-05, "loss": 0.0059, "step": 175310 }, { "epoch": 1.9, "learning_rate": 1.5703444249854055e-05, "loss": 0.0062, "step": 175320 }, { "epoch": 1.9, "learning_rate": 1.568722838425115e-05, "loss": 0.0072, "step": 175330 }, { "epoch": 1.9, "learning_rate": 1.5671012518648244e-05, "loss": 0.0072, "step": 175340 }, { "epoch": 1.9, "learning_rate": 1.5654796653045337e-05, "loss": 0.0086, "step": 175350 }, { "epoch": 1.9, "learning_rate": 1.5638580787442433e-05, "loss": 0.0076, "step": 175360 }, { "epoch": 1.9, "learning_rate": 1.5622364921839526e-05, "loss": 0.0082, "step": 175370 }, { "epoch": 1.9, "learning_rate": 1.5606149056236618e-05, "loss": 0.0065, "step": 175380 }, { "epoch": 1.9, "learning_rate": 1.5589933190633714e-05, "loss": 0.0057, "step": 175390 }, { "epoch": 1.9, "learning_rate": 1.5573717325030807e-05, "loss": 0.0062, "step": 175400 }, { "epoch": 1.9, "learning_rate": 1.5557501459427903e-05, "loss": 0.0065, "step": 175410 }, { "epoch": 1.9, "learning_rate": 1.5541285593825e-05, "loss": 0.0065, "step": 175420 }, { "epoch": 1.9, "learning_rate": 1.5525069728222092e-05, "loss": 0.0048, "step": 175430 }, { "epoch": 1.9, "learning_rate": 1.5508853862619185e-05, "loss": 0.0069, "step": 175440 }, { "epoch": 1.9, "learning_rate": 1.549263799701628e-05, "loss": 0.0062, "step": 175450 }, { "epoch": 1.9, "learning_rate": 1.5476422131413374e-05, "loss": 0.0069, "step": 175460 }, { "epoch": 1.9, "learning_rate": 1.5460206265810467e-05, "loss": 0.008, "step": 175470 }, { "epoch": 1.9, "learning_rate": 1.5443990400207563e-05, "loss": 0.0045, "step": 175480 }, { "epoch": 1.9, "learning_rate": 1.5427774534604655e-05, "loss": 0.0078, "step": 175490 }, { "epoch": 1.9, "learning_rate": 1.541155866900175e-05, "loss": 0.0044, "step": 175500 }, { "epoch": 1.9, "learning_rate": 1.5395342803398844e-05, "loss": 0.0089, "step": 175510 }, { "epoch": 1.9, "learning_rate": 1.5379126937795937e-05, "loss": 0.0067, "step": 175520 }, { "epoch": 1.9, "learning_rate": 1.5362911072193033e-05, "loss": 0.0064, "step": 175530 }, { "epoch": 1.9, "learning_rate": 1.5346695206590126e-05, "loss": 0.007, "step": 175540 }, { "epoch": 1.9, "learning_rate": 1.533047934098722e-05, "loss": 0.0062, "step": 175550 }, { "epoch": 1.9, "learning_rate": 1.5314263475384315e-05, "loss": 0.0063, "step": 175560 }, { "epoch": 1.9, "learning_rate": 1.5298047609781407e-05, "loss": 0.0081, "step": 175570 }, { "epoch": 1.9, "learning_rate": 1.5281831744178504e-05, "loss": 0.006, "step": 175580 }, { "epoch": 1.9, "learning_rate": 1.5265615878575596e-05, "loss": 0.0066, "step": 175590 }, { "epoch": 1.9, "learning_rate": 1.5249400012972693e-05, "loss": 0.006, "step": 175600 }, { "epoch": 1.9, "learning_rate": 1.5233184147369787e-05, "loss": 0.0053, "step": 175610 }, { "epoch": 1.9, "learning_rate": 1.521696828176688e-05, "loss": 0.0054, "step": 175620 }, { "epoch": 1.9, "learning_rate": 1.5200752416163974e-05, "loss": 0.0064, "step": 175630 }, { "epoch": 1.9, "learning_rate": 1.5184536550561069e-05, "loss": 0.0058, "step": 175640 }, { "epoch": 1.9, "learning_rate": 1.5168320684958163e-05, "loss": 0.0051, "step": 175650 }, { "epoch": 1.9, "learning_rate": 1.5152104819355256e-05, "loss": 0.0051, "step": 175660 }, { "epoch": 1.9, "learning_rate": 1.513588895375235e-05, "loss": 0.0068, "step": 175670 }, { "epoch": 1.9, "learning_rate": 1.5119673088149445e-05, "loss": 0.006, "step": 175680 }, { "epoch": 1.9, "learning_rate": 1.5103457222546537e-05, "loss": 0.0077, "step": 175690 }, { "epoch": 1.9, "learning_rate": 1.5087241356943632e-05, "loss": 0.0056, "step": 175700 }, { "epoch": 1.9, "learning_rate": 1.5071025491340726e-05, "loss": 0.0058, "step": 175710 }, { "epoch": 1.9, "learning_rate": 1.505480962573782e-05, "loss": 0.0045, "step": 175720 }, { "epoch": 1.9, "learning_rate": 1.5038593760134913e-05, "loss": 0.0069, "step": 175730 }, { "epoch": 1.9, "learning_rate": 1.5022377894532008e-05, "loss": 0.0061, "step": 175740 }, { "epoch": 1.9, "learning_rate": 1.5006162028929102e-05, "loss": 0.0059, "step": 175750 }, { "epoch": 1.9, "learning_rate": 1.4989946163326197e-05, "loss": 0.0055, "step": 175760 }, { "epoch": 1.9, "learning_rate": 1.497373029772329e-05, "loss": 0.0063, "step": 175770 }, { "epoch": 1.9, "learning_rate": 1.4957514432120386e-05, "loss": 0.0072, "step": 175780 }, { "epoch": 1.9, "learning_rate": 1.494129856651748e-05, "loss": 0.0061, "step": 175790 }, { "epoch": 1.9, "learning_rate": 1.4925082700914574e-05, "loss": 0.0081, "step": 175800 }, { "epoch": 1.9, "learning_rate": 1.4908866835311669e-05, "loss": 0.0062, "step": 175810 }, { "epoch": 1.9, "learning_rate": 1.4892650969708762e-05, "loss": 0.0065, "step": 175820 }, { "epoch": 1.9, "learning_rate": 1.4876435104105856e-05, "loss": 0.005, "step": 175830 }, { "epoch": 1.9, "learning_rate": 1.486021923850295e-05, "loss": 0.0059, "step": 175840 }, { "epoch": 1.9, "learning_rate": 1.4844003372900045e-05, "loss": 0.0081, "step": 175850 }, { "epoch": 1.9, "learning_rate": 1.4827787507297138e-05, "loss": 0.0061, "step": 175860 }, { "epoch": 1.9, "learning_rate": 1.4811571641694232e-05, "loss": 0.0066, "step": 175870 }, { "epoch": 1.9, "learning_rate": 1.4795355776091327e-05, "loss": 0.0067, "step": 175880 }, { "epoch": 1.9, "learning_rate": 1.4779139910488421e-05, "loss": 0.0067, "step": 175890 }, { "epoch": 1.9, "learning_rate": 1.4762924044885514e-05, "loss": 0.0059, "step": 175900 }, { "epoch": 1.9, "learning_rate": 1.4746708179282608e-05, "loss": 0.0073, "step": 175910 }, { "epoch": 1.9, "learning_rate": 1.4730492313679703e-05, "loss": 0.0056, "step": 175920 }, { "epoch": 1.9, "learning_rate": 1.4714276448076797e-05, "loss": 0.0062, "step": 175930 }, { "epoch": 1.9, "learning_rate": 1.469806058247389e-05, "loss": 0.0055, "step": 175940 }, { "epoch": 1.9, "learning_rate": 1.4681844716870984e-05, "loss": 0.0051, "step": 175950 }, { "epoch": 1.9, "learning_rate": 1.466562885126808e-05, "loss": 0.0047, "step": 175960 }, { "epoch": 1.9, "learning_rate": 1.4649412985665175e-05, "loss": 0.0068, "step": 175970 }, { "epoch": 1.9, "learning_rate": 1.463319712006227e-05, "loss": 0.0054, "step": 175980 }, { "epoch": 1.9, "learning_rate": 1.4616981254459362e-05, "loss": 0.005, "step": 175990 }, { "epoch": 1.9, "learning_rate": 1.4600765388856456e-05, "loss": 0.0066, "step": 176000 }, { "epoch": 1.9, "eval_cer": 0.9215026136262957, "eval_loss": 0.005302069243043661, "eval_runtime": 121.5231, "eval_samples_per_second": 16.458, "eval_steps_per_second": 4.114, "step": 176000 }, { "epoch": 1.9, "learning_rate": 1.4584549523253551e-05, "loss": 0.0056, "step": 176010 }, { "epoch": 1.9, "learning_rate": 1.4568333657650644e-05, "loss": 0.0059, "step": 176020 }, { "epoch": 1.9, "learning_rate": 1.4552117792047738e-05, "loss": 0.0064, "step": 176030 }, { "epoch": 1.9, "learning_rate": 1.4535901926444833e-05, "loss": 0.0051, "step": 176040 }, { "epoch": 1.9, "learning_rate": 1.4519686060841927e-05, "loss": 0.0065, "step": 176050 }, { "epoch": 1.9, "learning_rate": 1.450347019523902e-05, "loss": 0.0064, "step": 176060 }, { "epoch": 1.9, "learning_rate": 1.4487254329636114e-05, "loss": 0.0059, "step": 176070 }, { "epoch": 1.9, "learning_rate": 1.4471038464033209e-05, "loss": 0.0068, "step": 176080 }, { "epoch": 1.9, "learning_rate": 1.4454822598430303e-05, "loss": 0.0067, "step": 176090 }, { "epoch": 1.9, "learning_rate": 1.4438606732827396e-05, "loss": 0.0044, "step": 176100 }, { "epoch": 1.9, "learning_rate": 1.442239086722449e-05, "loss": 0.0049, "step": 176110 }, { "epoch": 1.9, "learning_rate": 1.4406175001621585e-05, "loss": 0.0059, "step": 176120 }, { "epoch": 1.9, "learning_rate": 1.4389959136018679e-05, "loss": 0.0049, "step": 176130 }, { "epoch": 1.9, "learning_rate": 1.4373743270415775e-05, "loss": 0.0065, "step": 176140 }, { "epoch": 1.9, "learning_rate": 1.4357527404812868e-05, "loss": 0.0085, "step": 176150 }, { "epoch": 1.9, "learning_rate": 1.4341311539209962e-05, "loss": 0.0059, "step": 176160 }, { "epoch": 1.9, "learning_rate": 1.4325095673607057e-05, "loss": 0.0073, "step": 176170 }, { "epoch": 1.9, "learning_rate": 1.4308879808004151e-05, "loss": 0.0047, "step": 176180 }, { "epoch": 1.9, "learning_rate": 1.4292663942401244e-05, "loss": 0.0086, "step": 176190 }, { "epoch": 1.9, "learning_rate": 1.4276448076798338e-05, "loss": 0.0048, "step": 176200 }, { "epoch": 1.9, "learning_rate": 1.4260232211195433e-05, "loss": 0.0064, "step": 176210 }, { "epoch": 1.91, "learning_rate": 1.4244016345592527e-05, "loss": 0.0064, "step": 176220 }, { "epoch": 1.91, "learning_rate": 1.422780047998962e-05, "loss": 0.0051, "step": 176230 }, { "epoch": 1.91, "learning_rate": 1.4211584614386714e-05, "loss": 0.0058, "step": 176240 }, { "epoch": 1.91, "learning_rate": 1.4195368748783809e-05, "loss": 0.007, "step": 176250 }, { "epoch": 1.91, "learning_rate": 1.4179152883180903e-05, "loss": 0.0066, "step": 176260 }, { "epoch": 1.91, "learning_rate": 1.4162937017577996e-05, "loss": 0.0055, "step": 176270 }, { "epoch": 1.91, "learning_rate": 1.414672115197509e-05, "loss": 0.008, "step": 176280 }, { "epoch": 1.91, "learning_rate": 1.4130505286372185e-05, "loss": 0.007, "step": 176290 }, { "epoch": 1.91, "learning_rate": 1.411428942076928e-05, "loss": 0.0073, "step": 176300 }, { "epoch": 1.91, "learning_rate": 1.4098073555166372e-05, "loss": 0.0063, "step": 176310 }, { "epoch": 1.91, "learning_rate": 1.4081857689563468e-05, "loss": 0.0061, "step": 176320 }, { "epoch": 1.91, "learning_rate": 1.4065641823960563e-05, "loss": 0.0055, "step": 176330 }, { "epoch": 1.91, "learning_rate": 1.4049425958357657e-05, "loss": 0.0088, "step": 176340 }, { "epoch": 1.91, "learning_rate": 1.403321009275475e-05, "loss": 0.0061, "step": 176350 }, { "epoch": 1.91, "learning_rate": 1.4016994227151844e-05, "loss": 0.008, "step": 176360 }, { "epoch": 1.91, "learning_rate": 1.4000778361548939e-05, "loss": 0.0067, "step": 176370 }, { "epoch": 1.91, "learning_rate": 1.3984562495946033e-05, "loss": 0.0064, "step": 176380 }, { "epoch": 1.91, "learning_rate": 1.3968346630343126e-05, "loss": 0.0051, "step": 176390 }, { "epoch": 1.91, "learning_rate": 1.395213076474022e-05, "loss": 0.0101, "step": 176400 }, { "epoch": 1.91, "learning_rate": 1.3935914899137315e-05, "loss": 0.0056, "step": 176410 }, { "epoch": 1.91, "learning_rate": 1.391969903353441e-05, "loss": 0.0058, "step": 176420 }, { "epoch": 1.91, "learning_rate": 1.3903483167931502e-05, "loss": 0.0079, "step": 176430 }, { "epoch": 1.91, "learning_rate": 1.3887267302328596e-05, "loss": 0.0057, "step": 176440 }, { "epoch": 1.91, "learning_rate": 1.3871051436725691e-05, "loss": 0.0041, "step": 176450 }, { "epoch": 1.91, "learning_rate": 1.3854835571122785e-05, "loss": 0.0058, "step": 176460 }, { "epoch": 1.91, "learning_rate": 1.3838619705519878e-05, "loss": 0.0064, "step": 176470 }, { "epoch": 1.91, "learning_rate": 1.3822403839916973e-05, "loss": 0.0063, "step": 176480 }, { "epoch": 1.91, "learning_rate": 1.3806187974314067e-05, "loss": 0.0069, "step": 176490 }, { "epoch": 1.91, "learning_rate": 1.3789972108711163e-05, "loss": 0.0056, "step": 176500 }, { "epoch": 1.91, "learning_rate": 1.3773756243108258e-05, "loss": 0.0055, "step": 176510 }, { "epoch": 1.91, "learning_rate": 1.375754037750535e-05, "loss": 0.0054, "step": 176520 }, { "epoch": 1.91, "learning_rate": 1.3741324511902445e-05, "loss": 0.0091, "step": 176530 }, { "epoch": 1.91, "learning_rate": 1.3725108646299539e-05, "loss": 0.0087, "step": 176540 }, { "epoch": 1.91, "learning_rate": 1.3708892780696634e-05, "loss": 0.0058, "step": 176550 }, { "epoch": 1.91, "learning_rate": 1.3692676915093726e-05, "loss": 0.0074, "step": 176560 }, { "epoch": 1.91, "learning_rate": 1.367646104949082e-05, "loss": 0.0073, "step": 176570 }, { "epoch": 1.91, "learning_rate": 1.3660245183887915e-05, "loss": 0.0067, "step": 176580 }, { "epoch": 1.91, "learning_rate": 1.364402931828501e-05, "loss": 0.0057, "step": 176590 }, { "epoch": 1.91, "learning_rate": 1.3627813452682102e-05, "loss": 0.0076, "step": 176600 }, { "epoch": 1.91, "learning_rate": 1.3611597587079197e-05, "loss": 0.0064, "step": 176610 }, { "epoch": 1.91, "learning_rate": 1.3595381721476291e-05, "loss": 0.0058, "step": 176620 }, { "epoch": 1.91, "learning_rate": 1.3579165855873386e-05, "loss": 0.006, "step": 176630 }, { "epoch": 1.91, "learning_rate": 1.3562949990270478e-05, "loss": 0.006, "step": 176640 }, { "epoch": 1.91, "learning_rate": 1.3546734124667573e-05, "loss": 0.0063, "step": 176650 }, { "epoch": 1.91, "learning_rate": 1.3530518259064667e-05, "loss": 0.0059, "step": 176660 }, { "epoch": 1.91, "learning_rate": 1.351430239346176e-05, "loss": 0.0049, "step": 176670 }, { "epoch": 1.91, "learning_rate": 1.3498086527858856e-05, "loss": 0.0081, "step": 176680 }, { "epoch": 1.91, "learning_rate": 1.348187066225595e-05, "loss": 0.0053, "step": 176690 }, { "epoch": 1.91, "learning_rate": 1.3465654796653045e-05, "loss": 0.0053, "step": 176700 }, { "epoch": 1.91, "learning_rate": 1.344943893105014e-05, "loss": 0.0065, "step": 176710 }, { "epoch": 1.91, "learning_rate": 1.3433223065447232e-05, "loss": 0.0056, "step": 176720 }, { "epoch": 1.91, "learning_rate": 1.3417007199844327e-05, "loss": 0.0059, "step": 176730 }, { "epoch": 1.91, "learning_rate": 1.3400791334241421e-05, "loss": 0.0078, "step": 176740 }, { "epoch": 1.91, "learning_rate": 1.3384575468638516e-05, "loss": 0.008, "step": 176750 }, { "epoch": 1.91, "learning_rate": 1.3368359603035608e-05, "loss": 0.0065, "step": 176760 }, { "epoch": 1.91, "learning_rate": 1.3352143737432703e-05, "loss": 0.0066, "step": 176770 }, { "epoch": 1.91, "learning_rate": 1.3335927871829797e-05, "loss": 0.0052, "step": 176780 }, { "epoch": 1.91, "learning_rate": 1.3319712006226892e-05, "loss": 0.0071, "step": 176790 }, { "epoch": 1.91, "learning_rate": 1.3303496140623984e-05, "loss": 0.0073, "step": 176800 }, { "epoch": 1.91, "learning_rate": 1.3287280275021079e-05, "loss": 0.0064, "step": 176810 }, { "epoch": 1.91, "learning_rate": 1.3271064409418173e-05, "loss": 0.0063, "step": 176820 }, { "epoch": 1.91, "learning_rate": 1.3254848543815268e-05, "loss": 0.0055, "step": 176830 }, { "epoch": 1.91, "learning_rate": 1.323863267821236e-05, "loss": 0.0064, "step": 176840 }, { "epoch": 1.91, "learning_rate": 1.3222416812609455e-05, "loss": 0.0053, "step": 176850 }, { "epoch": 1.91, "learning_rate": 1.3206200947006551e-05, "loss": 0.0051, "step": 176860 }, { "epoch": 1.91, "learning_rate": 1.3189985081403645e-05, "loss": 0.0086, "step": 176870 }, { "epoch": 1.91, "learning_rate": 1.317376921580074e-05, "loss": 0.0055, "step": 176880 }, { "epoch": 1.91, "learning_rate": 1.3157553350197833e-05, "loss": 0.0055, "step": 176890 }, { "epoch": 1.91, "learning_rate": 1.3141337484594927e-05, "loss": 0.0069, "step": 176900 }, { "epoch": 1.91, "learning_rate": 1.3125121618992021e-05, "loss": 0.0082, "step": 176910 }, { "epoch": 1.91, "learning_rate": 1.3108905753389116e-05, "loss": 0.0069, "step": 176920 }, { "epoch": 1.91, "learning_rate": 1.3092689887786209e-05, "loss": 0.0052, "step": 176930 }, { "epoch": 1.91, "learning_rate": 1.3076474022183303e-05, "loss": 0.005, "step": 176940 }, { "epoch": 1.91, "learning_rate": 1.3060258156580398e-05, "loss": 0.0058, "step": 176950 }, { "epoch": 1.91, "learning_rate": 1.304404229097749e-05, "loss": 0.004, "step": 176960 }, { "epoch": 1.91, "learning_rate": 1.3027826425374585e-05, "loss": 0.0066, "step": 176970 }, { "epoch": 1.91, "learning_rate": 1.3011610559771679e-05, "loss": 0.0065, "step": 176980 }, { "epoch": 1.91, "learning_rate": 1.2995394694168774e-05, "loss": 0.0061, "step": 176990 }, { "epoch": 1.91, "learning_rate": 1.2979178828565866e-05, "loss": 0.0084, "step": 177000 }, { "epoch": 1.91, "eval_cer": 0.9214921903908192, "eval_loss": 0.005274078343063593, "eval_runtime": 121.1903, "eval_samples_per_second": 16.503, "eval_steps_per_second": 4.126, "step": 177000 }, { "epoch": 1.91, "learning_rate": 1.296296296296296e-05, "loss": 0.0065, "step": 177010 }, { "epoch": 1.91, "learning_rate": 1.2946747097360055e-05, "loss": 0.0059, "step": 177020 }, { "epoch": 1.91, "learning_rate": 1.293053123175715e-05, "loss": 0.0064, "step": 177030 }, { "epoch": 1.91, "learning_rate": 1.2914315366154246e-05, "loss": 0.0056, "step": 177040 }, { "epoch": 1.91, "learning_rate": 1.2898099500551339e-05, "loss": 0.0076, "step": 177050 }, { "epoch": 1.91, "learning_rate": 1.2881883634948433e-05, "loss": 0.0058, "step": 177060 }, { "epoch": 1.91, "learning_rate": 1.2865667769345527e-05, "loss": 0.0061, "step": 177070 }, { "epoch": 1.91, "learning_rate": 1.2849451903742622e-05, "loss": 0.0048, "step": 177080 }, { "epoch": 1.91, "learning_rate": 1.2833236038139715e-05, "loss": 0.0056, "step": 177090 }, { "epoch": 1.91, "learning_rate": 1.2817020172536809e-05, "loss": 0.0059, "step": 177100 }, { "epoch": 1.91, "learning_rate": 1.2800804306933903e-05, "loss": 0.0075, "step": 177110 }, { "epoch": 1.91, "learning_rate": 1.2784588441330998e-05, "loss": 0.0058, "step": 177120 }, { "epoch": 1.91, "learning_rate": 1.276837257572809e-05, "loss": 0.0069, "step": 177130 }, { "epoch": 1.91, "learning_rate": 1.2752156710125185e-05, "loss": 0.0083, "step": 177140 }, { "epoch": 1.92, "learning_rate": 1.273594084452228e-05, "loss": 0.0057, "step": 177150 }, { "epoch": 1.92, "learning_rate": 1.2719724978919374e-05, "loss": 0.0066, "step": 177160 }, { "epoch": 1.92, "learning_rate": 1.2703509113316467e-05, "loss": 0.0081, "step": 177170 }, { "epoch": 1.92, "learning_rate": 1.2687293247713561e-05, "loss": 0.0069, "step": 177180 }, { "epoch": 1.92, "learning_rate": 1.2671077382110656e-05, "loss": 0.0072, "step": 177190 }, { "epoch": 1.92, "learning_rate": 1.265486151650775e-05, "loss": 0.0079, "step": 177200 }, { "epoch": 1.92, "learning_rate": 1.2638645650904843e-05, "loss": 0.0058, "step": 177210 }, { "epoch": 1.92, "learning_rate": 1.2622429785301939e-05, "loss": 0.0061, "step": 177220 }, { "epoch": 1.92, "learning_rate": 1.2606213919699033e-05, "loss": 0.0068, "step": 177230 }, { "epoch": 1.92, "learning_rate": 1.2589998054096128e-05, "loss": 0.0092, "step": 177240 }, { "epoch": 1.92, "learning_rate": 1.2573782188493222e-05, "loss": 0.006, "step": 177250 }, { "epoch": 1.92, "learning_rate": 1.2557566322890315e-05, "loss": 0.0059, "step": 177260 }, { "epoch": 1.92, "learning_rate": 1.254135045728741e-05, "loss": 0.0044, "step": 177270 }, { "epoch": 1.92, "learning_rate": 1.2525134591684504e-05, "loss": 0.0063, "step": 177280 }, { "epoch": 1.92, "learning_rate": 1.2508918726081597e-05, "loss": 0.0042, "step": 177290 }, { "epoch": 1.92, "learning_rate": 1.2492702860478691e-05, "loss": 0.0057, "step": 177300 }, { "epoch": 1.92, "learning_rate": 1.2476486994875785e-05, "loss": 0.0059, "step": 177310 }, { "epoch": 1.92, "learning_rate": 1.246027112927288e-05, "loss": 0.0069, "step": 177320 }, { "epoch": 1.92, "learning_rate": 1.2444055263669973e-05, "loss": 0.0102, "step": 177330 }, { "epoch": 1.92, "learning_rate": 1.2427839398067067e-05, "loss": 0.0068, "step": 177340 }, { "epoch": 1.92, "learning_rate": 1.2411623532464161e-05, "loss": 0.0062, "step": 177350 }, { "epoch": 1.92, "learning_rate": 1.2395407666861256e-05, "loss": 0.0073, "step": 177360 }, { "epoch": 1.92, "learning_rate": 1.2379191801258349e-05, "loss": 0.0072, "step": 177370 }, { "epoch": 1.92, "learning_rate": 1.2362975935655443e-05, "loss": 0.006, "step": 177380 }, { "epoch": 1.92, "learning_rate": 1.2346760070052538e-05, "loss": 0.0082, "step": 177390 }, { "epoch": 1.92, "learning_rate": 1.2330544204449634e-05, "loss": 0.0052, "step": 177400 }, { "epoch": 1.92, "learning_rate": 1.2314328338846728e-05, "loss": 0.0064, "step": 177410 }, { "epoch": 1.92, "learning_rate": 1.229811247324382e-05, "loss": 0.0061, "step": 177420 }, { "epoch": 1.92, "learning_rate": 1.2281896607640915e-05, "loss": 0.0077, "step": 177430 }, { "epoch": 1.92, "learning_rate": 1.226568074203801e-05, "loss": 0.0057, "step": 177440 }, { "epoch": 1.92, "learning_rate": 1.2249464876435104e-05, "loss": 0.005, "step": 177450 }, { "epoch": 1.92, "learning_rate": 1.2233249010832197e-05, "loss": 0.0077, "step": 177460 }, { "epoch": 1.92, "learning_rate": 1.2217033145229291e-05, "loss": 0.0066, "step": 177470 }, { "epoch": 1.92, "learning_rate": 1.2200817279626386e-05, "loss": 0.0054, "step": 177480 }, { "epoch": 1.92, "learning_rate": 1.218460141402348e-05, "loss": 0.0073, "step": 177490 }, { "epoch": 1.92, "learning_rate": 1.2168385548420573e-05, "loss": 0.0073, "step": 177500 }, { "epoch": 1.92, "learning_rate": 1.2152169682817667e-05, "loss": 0.0069, "step": 177510 }, { "epoch": 1.92, "learning_rate": 1.2135953817214762e-05, "loss": 0.0066, "step": 177520 }, { "epoch": 1.92, "learning_rate": 1.2119737951611856e-05, "loss": 0.0061, "step": 177530 }, { "epoch": 1.92, "learning_rate": 1.2103522086008949e-05, "loss": 0.0062, "step": 177540 }, { "epoch": 1.92, "learning_rate": 1.2087306220406043e-05, "loss": 0.008, "step": 177550 }, { "epoch": 1.92, "learning_rate": 1.2071090354803138e-05, "loss": 0.0053, "step": 177560 }, { "epoch": 1.92, "learning_rate": 1.2054874489200232e-05, "loss": 0.0067, "step": 177570 }, { "epoch": 1.92, "learning_rate": 1.2038658623597327e-05, "loss": 0.0073, "step": 177580 }, { "epoch": 1.92, "learning_rate": 1.2022442757994421e-05, "loss": 0.0048, "step": 177590 }, { "epoch": 1.92, "learning_rate": 1.2006226892391516e-05, "loss": 0.0044, "step": 177600 }, { "epoch": 1.92, "learning_rate": 1.199001102678861e-05, "loss": 0.0066, "step": 177610 }, { "epoch": 1.92, "learning_rate": 1.1973795161185703e-05, "loss": 0.0048, "step": 177620 }, { "epoch": 1.92, "learning_rate": 1.1957579295582797e-05, "loss": 0.0078, "step": 177630 }, { "epoch": 1.92, "learning_rate": 1.1941363429979892e-05, "loss": 0.0046, "step": 177640 }, { "epoch": 1.92, "learning_rate": 1.1925147564376986e-05, "loss": 0.006, "step": 177650 }, { "epoch": 1.92, "learning_rate": 1.1908931698774079e-05, "loss": 0.0055, "step": 177660 }, { "epoch": 1.92, "learning_rate": 1.1892715833171173e-05, "loss": 0.006, "step": 177670 }, { "epoch": 1.92, "learning_rate": 1.1876499967568268e-05, "loss": 0.0069, "step": 177680 }, { "epoch": 1.92, "learning_rate": 1.1860284101965362e-05, "loss": 0.0061, "step": 177690 }, { "epoch": 1.92, "learning_rate": 1.1844068236362455e-05, "loss": 0.009, "step": 177700 }, { "epoch": 1.92, "learning_rate": 1.182785237075955e-05, "loss": 0.0049, "step": 177710 }, { "epoch": 1.92, "learning_rate": 1.1811636505156644e-05, "loss": 0.0064, "step": 177720 }, { "epoch": 1.92, "learning_rate": 1.1795420639553738e-05, "loss": 0.0052, "step": 177730 }, { "epoch": 1.92, "learning_rate": 1.1779204773950831e-05, "loss": 0.0056, "step": 177740 }, { "epoch": 1.92, "learning_rate": 1.1762988908347925e-05, "loss": 0.0058, "step": 177750 }, { "epoch": 1.92, "learning_rate": 1.1746773042745022e-05, "loss": 0.0074, "step": 177760 }, { "epoch": 1.92, "learning_rate": 1.1730557177142116e-05, "loss": 0.008, "step": 177770 }, { "epoch": 1.92, "learning_rate": 1.171434131153921e-05, "loss": 0.0079, "step": 177780 }, { "epoch": 1.92, "learning_rate": 1.1698125445936303e-05, "loss": 0.0057, "step": 177790 }, { "epoch": 1.92, "learning_rate": 1.1681909580333398e-05, "loss": 0.0104, "step": 177800 }, { "epoch": 1.92, "learning_rate": 1.1665693714730492e-05, "loss": 0.0067, "step": 177810 }, { "epoch": 1.92, "learning_rate": 1.1649477849127586e-05, "loss": 0.006, "step": 177820 }, { "epoch": 1.92, "learning_rate": 1.163326198352468e-05, "loss": 0.0049, "step": 177830 }, { "epoch": 1.92, "learning_rate": 1.1617046117921774e-05, "loss": 0.0056, "step": 177840 }, { "epoch": 1.92, "learning_rate": 1.1600830252318868e-05, "loss": 0.0089, "step": 177850 }, { "epoch": 1.92, "learning_rate": 1.1584614386715963e-05, "loss": 0.0066, "step": 177860 }, { "epoch": 1.92, "learning_rate": 1.1568398521113055e-05, "loss": 0.0056, "step": 177870 }, { "epoch": 1.92, "learning_rate": 1.155218265551015e-05, "loss": 0.005, "step": 177880 }, { "epoch": 1.92, "learning_rate": 1.1535966789907244e-05, "loss": 0.0082, "step": 177890 }, { "epoch": 1.92, "learning_rate": 1.1519750924304337e-05, "loss": 0.005, "step": 177900 }, { "epoch": 1.92, "learning_rate": 1.1503535058701431e-05, "loss": 0.0083, "step": 177910 }, { "epoch": 1.92, "learning_rate": 1.1487319193098526e-05, "loss": 0.0074, "step": 177920 }, { "epoch": 1.92, "learning_rate": 1.147110332749562e-05, "loss": 0.0071, "step": 177930 }, { "epoch": 1.92, "learning_rate": 1.1454887461892716e-05, "loss": 0.0045, "step": 177940 }, { "epoch": 1.92, "learning_rate": 1.1438671596289809e-05, "loss": 0.0051, "step": 177950 }, { "epoch": 1.92, "learning_rate": 1.1422455730686904e-05, "loss": 0.0059, "step": 177960 }, { "epoch": 1.92, "learning_rate": 1.1406239865083998e-05, "loss": 0.0061, "step": 177970 }, { "epoch": 1.92, "learning_rate": 1.1390023999481092e-05, "loss": 0.0055, "step": 177980 }, { "epoch": 1.92, "learning_rate": 1.1373808133878185e-05, "loss": 0.0059, "step": 177990 }, { "epoch": 1.92, "learning_rate": 1.135759226827528e-05, "loss": 0.0066, "step": 178000 }, { "epoch": 1.92, "eval_cer": 0.9214965334056011, "eval_loss": 0.005222100764513016, "eval_runtime": 121.1363, "eval_samples_per_second": 16.51, "eval_steps_per_second": 4.128, "step": 178000 }, { "epoch": 1.92, "learning_rate": 1.1341376402672374e-05, "loss": 0.005, "step": 178010 }, { "epoch": 1.92, "learning_rate": 1.1325160537069468e-05, "loss": 0.0053, "step": 178020 }, { "epoch": 1.92, "learning_rate": 1.1308944671466561e-05, "loss": 0.0081, "step": 178030 }, { "epoch": 1.92, "learning_rate": 1.1292728805863656e-05, "loss": 0.0056, "step": 178040 }, { "epoch": 1.92, "learning_rate": 1.127651294026075e-05, "loss": 0.0064, "step": 178050 }, { "epoch": 1.92, "learning_rate": 1.1260297074657845e-05, "loss": 0.0057, "step": 178060 }, { "epoch": 1.93, "learning_rate": 1.1244081209054937e-05, "loss": 0.004, "step": 178070 }, { "epoch": 1.93, "learning_rate": 1.1227865343452032e-05, "loss": 0.0061, "step": 178080 }, { "epoch": 1.93, "learning_rate": 1.1211649477849126e-05, "loss": 0.0041, "step": 178090 }, { "epoch": 1.93, "learning_rate": 1.119543361224622e-05, "loss": 0.0051, "step": 178100 }, { "epoch": 1.93, "learning_rate": 1.1179217746643313e-05, "loss": 0.0057, "step": 178110 }, { "epoch": 1.93, "learning_rate": 1.116300188104041e-05, "loss": 0.0071, "step": 178120 }, { "epoch": 1.93, "learning_rate": 1.1146786015437504e-05, "loss": 0.0066, "step": 178130 }, { "epoch": 1.93, "learning_rate": 1.1130570149834598e-05, "loss": 0.0048, "step": 178140 }, { "epoch": 1.93, "learning_rate": 1.1114354284231693e-05, "loss": 0.0066, "step": 178150 }, { "epoch": 1.93, "learning_rate": 1.1098138418628785e-05, "loss": 0.0049, "step": 178160 }, { "epoch": 1.93, "learning_rate": 1.108192255302588e-05, "loss": 0.006, "step": 178170 }, { "epoch": 1.93, "learning_rate": 1.1065706687422974e-05, "loss": 0.0062, "step": 178180 }, { "epoch": 1.93, "learning_rate": 1.1049490821820069e-05, "loss": 0.0063, "step": 178190 }, { "epoch": 1.93, "learning_rate": 1.1033274956217162e-05, "loss": 0.0057, "step": 178200 }, { "epoch": 1.93, "learning_rate": 1.1017059090614256e-05, "loss": 0.0051, "step": 178210 }, { "epoch": 1.93, "learning_rate": 1.100084322501135e-05, "loss": 0.0037, "step": 178220 }, { "epoch": 1.93, "learning_rate": 1.0984627359408443e-05, "loss": 0.0053, "step": 178230 }, { "epoch": 1.93, "learning_rate": 1.0968411493805538e-05, "loss": 0.007, "step": 178240 }, { "epoch": 1.93, "learning_rate": 1.0952195628202632e-05, "loss": 0.0055, "step": 178250 }, { "epoch": 1.93, "learning_rate": 1.0935979762599726e-05, "loss": 0.0064, "step": 178260 }, { "epoch": 1.93, "learning_rate": 1.091976389699682e-05, "loss": 0.0048, "step": 178270 }, { "epoch": 1.93, "learning_rate": 1.0903548031393914e-05, "loss": 0.0062, "step": 178280 }, { "epoch": 1.93, "learning_rate": 1.0887332165791008e-05, "loss": 0.0082, "step": 178290 }, { "epoch": 1.93, "learning_rate": 1.0871116300188104e-05, "loss": 0.0059, "step": 178300 }, { "epoch": 1.93, "learning_rate": 1.0854900434585199e-05, "loss": 0.0059, "step": 178310 }, { "epoch": 1.93, "learning_rate": 1.0838684568982291e-05, "loss": 0.006, "step": 178320 }, { "epoch": 1.93, "learning_rate": 1.0822468703379386e-05, "loss": 0.006, "step": 178330 }, { "epoch": 1.93, "learning_rate": 1.080625283777648e-05, "loss": 0.0067, "step": 178340 }, { "epoch": 1.93, "learning_rate": 1.0790036972173575e-05, "loss": 0.0062, "step": 178350 }, { "epoch": 1.93, "learning_rate": 1.0773821106570667e-05, "loss": 0.0056, "step": 178360 }, { "epoch": 1.93, "learning_rate": 1.0757605240967762e-05, "loss": 0.0065, "step": 178370 }, { "epoch": 1.93, "learning_rate": 1.0741389375364856e-05, "loss": 0.0053, "step": 178380 }, { "epoch": 1.93, "learning_rate": 1.072517350976195e-05, "loss": 0.0057, "step": 178390 }, { "epoch": 1.93, "learning_rate": 1.0708957644159044e-05, "loss": 0.0066, "step": 178400 }, { "epoch": 1.93, "learning_rate": 1.0692741778556138e-05, "loss": 0.008, "step": 178410 }, { "epoch": 1.93, "learning_rate": 1.0676525912953232e-05, "loss": 0.0065, "step": 178420 }, { "epoch": 1.93, "learning_rate": 1.0660310047350327e-05, "loss": 0.0065, "step": 178430 }, { "epoch": 1.93, "learning_rate": 1.064409418174742e-05, "loss": 0.0061, "step": 178440 }, { "epoch": 1.93, "learning_rate": 1.0627878316144514e-05, "loss": 0.0061, "step": 178450 }, { "epoch": 1.93, "learning_rate": 1.0611662450541608e-05, "loss": 0.0047, "step": 178460 }, { "epoch": 1.93, "learning_rate": 1.0595446584938703e-05, "loss": 0.0078, "step": 178470 }, { "epoch": 1.93, "learning_rate": 1.0579230719335799e-05, "loss": 0.0068, "step": 178480 }, { "epoch": 1.93, "learning_rate": 1.0563014853732892e-05, "loss": 0.0042, "step": 178490 }, { "epoch": 1.93, "learning_rate": 1.0546798988129986e-05, "loss": 0.0086, "step": 178500 }, { "epoch": 1.93, "learning_rate": 1.053058312252708e-05, "loss": 0.0053, "step": 178510 }, { "epoch": 1.93, "learning_rate": 1.0514367256924173e-05, "loss": 0.0065, "step": 178520 }, { "epoch": 1.93, "learning_rate": 1.0498151391321268e-05, "loss": 0.0054, "step": 178530 }, { "epoch": 1.93, "learning_rate": 1.0481935525718362e-05, "loss": 0.0048, "step": 178540 }, { "epoch": 1.93, "learning_rate": 1.0465719660115457e-05, "loss": 0.006, "step": 178550 }, { "epoch": 1.93, "learning_rate": 1.044950379451255e-05, "loss": 0.0054, "step": 178560 }, { "epoch": 1.93, "learning_rate": 1.0433287928909644e-05, "loss": 0.0061, "step": 178570 }, { "epoch": 1.93, "learning_rate": 1.0417072063306738e-05, "loss": 0.0071, "step": 178580 }, { "epoch": 1.93, "learning_rate": 1.0400856197703833e-05, "loss": 0.0066, "step": 178590 }, { "epoch": 1.93, "learning_rate": 1.0384640332100926e-05, "loss": 0.0073, "step": 178600 }, { "epoch": 1.93, "learning_rate": 1.036842446649802e-05, "loss": 0.0061, "step": 178610 }, { "epoch": 1.93, "learning_rate": 1.0352208600895114e-05, "loss": 0.0048, "step": 178620 }, { "epoch": 1.93, "learning_rate": 1.0335992735292209e-05, "loss": 0.006, "step": 178630 }, { "epoch": 1.93, "learning_rate": 1.0319776869689302e-05, "loss": 0.0079, "step": 178640 }, { "epoch": 1.93, "learning_rate": 1.0303561004086396e-05, "loss": 0.0062, "step": 178650 }, { "epoch": 1.93, "learning_rate": 1.0287345138483492e-05, "loss": 0.0059, "step": 178660 }, { "epoch": 1.93, "learning_rate": 1.0271129272880587e-05, "loss": 0.0069, "step": 178670 }, { "epoch": 1.93, "learning_rate": 1.0254913407277681e-05, "loss": 0.0055, "step": 178680 }, { "epoch": 1.93, "learning_rate": 1.0238697541674774e-05, "loss": 0.005, "step": 178690 }, { "epoch": 1.93, "learning_rate": 1.0222481676071868e-05, "loss": 0.0051, "step": 178700 }, { "epoch": 1.93, "learning_rate": 1.0206265810468963e-05, "loss": 0.0049, "step": 178710 }, { "epoch": 1.93, "learning_rate": 1.0190049944866057e-05, "loss": 0.005, "step": 178720 }, { "epoch": 1.93, "learning_rate": 1.017383407926315e-05, "loss": 0.0088, "step": 178730 }, { "epoch": 1.93, "learning_rate": 1.0157618213660244e-05, "loss": 0.0074, "step": 178740 }, { "epoch": 1.93, "learning_rate": 1.0141402348057339e-05, "loss": 0.0055, "step": 178750 }, { "epoch": 1.93, "learning_rate": 1.0125186482454433e-05, "loss": 0.0062, "step": 178760 }, { "epoch": 1.93, "learning_rate": 1.0108970616851526e-05, "loss": 0.0092, "step": 178770 }, { "epoch": 1.93, "learning_rate": 1.009275475124862e-05, "loss": 0.0065, "step": 178780 }, { "epoch": 1.93, "learning_rate": 1.0076538885645715e-05, "loss": 0.0053, "step": 178790 }, { "epoch": 1.93, "learning_rate": 1.006032302004281e-05, "loss": 0.0072, "step": 178800 }, { "epoch": 1.93, "learning_rate": 1.0044107154439902e-05, "loss": 0.0064, "step": 178810 }, { "epoch": 1.93, "learning_rate": 1.0027891288836996e-05, "loss": 0.0056, "step": 178820 }, { "epoch": 1.93, "learning_rate": 1.001167542323409e-05, "loss": 0.006, "step": 178830 }, { "epoch": 1.93, "learning_rate": 9.995459557631187e-06, "loss": 0.0082, "step": 178840 }, { "epoch": 1.93, "learning_rate": 9.97924369202828e-06, "loss": 0.0056, "step": 178850 }, { "epoch": 1.93, "learning_rate": 9.963027826425374e-06, "loss": 0.0074, "step": 178860 }, { "epoch": 1.93, "learning_rate": 9.946811960822469e-06, "loss": 0.0065, "step": 178870 }, { "epoch": 1.93, "learning_rate": 9.930596095219563e-06, "loss": 0.0063, "step": 178880 }, { "epoch": 1.93, "learning_rate": 9.914380229616656e-06, "loss": 0.0061, "step": 178890 }, { "epoch": 1.93, "learning_rate": 9.89816436401375e-06, "loss": 0.004, "step": 178900 }, { "epoch": 1.93, "learning_rate": 9.881948498410845e-06, "loss": 0.0065, "step": 178910 }, { "epoch": 1.93, "learning_rate": 9.865732632807939e-06, "loss": 0.0053, "step": 178920 }, { "epoch": 1.93, "learning_rate": 9.849516767205032e-06, "loss": 0.007, "step": 178930 }, { "epoch": 1.93, "learning_rate": 9.833300901602126e-06, "loss": 0.0052, "step": 178940 }, { "epoch": 1.93, "learning_rate": 9.81708503599922e-06, "loss": 0.0076, "step": 178950 }, { "epoch": 1.93, "learning_rate": 9.800869170396315e-06, "loss": 0.0081, "step": 178960 }, { "epoch": 1.93, "learning_rate": 9.784653304793408e-06, "loss": 0.0069, "step": 178970 }, { "epoch": 1.93, "learning_rate": 9.768437439190502e-06, "loss": 0.0057, "step": 178980 }, { "epoch": 1.93, "learning_rate": 9.752221573587597e-06, "loss": 0.0069, "step": 178990 }, { "epoch": 1.94, "learning_rate": 9.736005707984691e-06, "loss": 0.0057, "step": 179000 }, { "epoch": 1.94, "eval_cer": 0.9215199856854233, "eval_loss": 0.005271059460937977, "eval_runtime": 121.1797, "eval_samples_per_second": 16.504, "eval_steps_per_second": 4.126, "step": 179000 }, { "epoch": 1.94, "learning_rate": 9.719789842381784e-06, "loss": 0.0054, "step": 179010 }, { "epoch": 1.94, "learning_rate": 9.70357397677888e-06, "loss": 0.0077, "step": 179020 }, { "epoch": 1.94, "learning_rate": 9.687358111175974e-06, "loss": 0.0062, "step": 179030 }, { "epoch": 1.94, "learning_rate": 9.671142245573069e-06, "loss": 0.0063, "step": 179040 }, { "epoch": 1.94, "learning_rate": 9.654926379970163e-06, "loss": 0.0062, "step": 179050 }, { "epoch": 1.94, "learning_rate": 9.638710514367256e-06, "loss": 0.0052, "step": 179060 }, { "epoch": 1.94, "learning_rate": 9.62249464876435e-06, "loss": 0.0045, "step": 179070 }, { "epoch": 1.94, "learning_rate": 9.606278783161445e-06, "loss": 0.0063, "step": 179080 }, { "epoch": 1.94, "learning_rate": 9.59006291755854e-06, "loss": 0.0073, "step": 179090 }, { "epoch": 1.94, "learning_rate": 9.573847051955632e-06, "loss": 0.0067, "step": 179100 }, { "epoch": 1.94, "learning_rate": 9.557631186352727e-06, "loss": 0.005, "step": 179110 }, { "epoch": 1.94, "learning_rate": 9.541415320749821e-06, "loss": 0.0045, "step": 179120 }, { "epoch": 1.94, "learning_rate": 9.525199455146915e-06, "loss": 0.0071, "step": 179130 }, { "epoch": 1.94, "learning_rate": 9.508983589544008e-06, "loss": 0.008, "step": 179140 }, { "epoch": 1.94, "learning_rate": 9.492767723941103e-06, "loss": 0.0053, "step": 179150 }, { "epoch": 1.94, "learning_rate": 9.476551858338197e-06, "loss": 0.0061, "step": 179160 }, { "epoch": 1.94, "learning_rate": 9.46033599273529e-06, "loss": 0.0056, "step": 179170 }, { "epoch": 1.94, "learning_rate": 9.444120127132384e-06, "loss": 0.0076, "step": 179180 }, { "epoch": 1.94, "learning_rate": 9.427904261529479e-06, "loss": 0.0068, "step": 179190 }, { "epoch": 1.94, "learning_rate": 9.411688395926575e-06, "loss": 0.0059, "step": 179200 }, { "epoch": 1.94, "learning_rate": 9.39547253032367e-06, "loss": 0.0081, "step": 179210 }, { "epoch": 1.94, "learning_rate": 9.379256664720762e-06, "loss": 0.007, "step": 179220 }, { "epoch": 1.94, "learning_rate": 9.363040799117856e-06, "loss": 0.0116, "step": 179230 }, { "epoch": 1.94, "learning_rate": 9.34682493351495e-06, "loss": 0.0063, "step": 179240 }, { "epoch": 1.94, "learning_rate": 9.330609067912045e-06, "loss": 0.0061, "step": 179250 }, { "epoch": 1.94, "learning_rate": 9.314393202309138e-06, "loss": 0.0046, "step": 179260 }, { "epoch": 1.94, "learning_rate": 9.298177336706232e-06, "loss": 0.0063, "step": 179270 }, { "epoch": 1.94, "learning_rate": 9.281961471103327e-06, "loss": 0.0054, "step": 179280 }, { "epoch": 1.94, "learning_rate": 9.265745605500421e-06, "loss": 0.0066, "step": 179290 }, { "epoch": 1.94, "learning_rate": 9.249529739897514e-06, "loss": 0.0069, "step": 179300 }, { "epoch": 1.94, "learning_rate": 9.233313874294609e-06, "loss": 0.0058, "step": 179310 }, { "epoch": 1.94, "learning_rate": 9.217098008691703e-06, "loss": 0.0078, "step": 179320 }, { "epoch": 1.94, "learning_rate": 9.200882143088797e-06, "loss": 0.0068, "step": 179330 }, { "epoch": 1.94, "learning_rate": 9.184666277485892e-06, "loss": 0.0074, "step": 179340 }, { "epoch": 1.94, "learning_rate": 9.168450411882986e-06, "loss": 0.005, "step": 179350 }, { "epoch": 1.94, "learning_rate": 9.152234546280079e-06, "loss": 0.0068, "step": 179360 }, { "epoch": 1.94, "learning_rate": 9.136018680677173e-06, "loss": 0.0071, "step": 179370 }, { "epoch": 1.94, "learning_rate": 9.119802815074268e-06, "loss": 0.0068, "step": 179380 }, { "epoch": 1.94, "learning_rate": 9.103586949471362e-06, "loss": 0.0082, "step": 179390 }, { "epoch": 1.94, "learning_rate": 9.087371083868455e-06, "loss": 0.0059, "step": 179400 }, { "epoch": 1.94, "learning_rate": 9.07115521826555e-06, "loss": 0.0068, "step": 179410 }, { "epoch": 1.94, "learning_rate": 9.054939352662644e-06, "loss": 0.0077, "step": 179420 }, { "epoch": 1.94, "learning_rate": 9.038723487059738e-06, "loss": 0.0086, "step": 179430 }, { "epoch": 1.94, "learning_rate": 9.022507621456833e-06, "loss": 0.0078, "step": 179440 }, { "epoch": 1.94, "learning_rate": 9.006291755853927e-06, "loss": 0.0067, "step": 179450 }, { "epoch": 1.94, "learning_rate": 8.990075890251022e-06, "loss": 0.0092, "step": 179460 }, { "epoch": 1.94, "learning_rate": 8.973860024648114e-06, "loss": 0.0074, "step": 179470 }, { "epoch": 1.94, "learning_rate": 8.957644159045209e-06, "loss": 0.0078, "step": 179480 }, { "epoch": 1.94, "learning_rate": 8.941428293442303e-06, "loss": 0.0079, "step": 179490 }, { "epoch": 1.94, "learning_rate": 8.925212427839396e-06, "loss": 0.0063, "step": 179500 }, { "epoch": 1.94, "learning_rate": 8.90899656223649e-06, "loss": 0.0081, "step": 179510 }, { "epoch": 1.94, "learning_rate": 8.892780696633587e-06, "loss": 0.0069, "step": 179520 }, { "epoch": 1.94, "learning_rate": 8.87656483103068e-06, "loss": 0.0074, "step": 179530 }, { "epoch": 1.94, "learning_rate": 8.860348965427774e-06, "loss": 0.0046, "step": 179540 }, { "epoch": 1.94, "learning_rate": 8.844133099824868e-06, "loss": 0.0072, "step": 179550 }, { "epoch": 1.94, "learning_rate": 8.827917234221963e-06, "loss": 0.006, "step": 179560 }, { "epoch": 1.94, "learning_rate": 8.811701368619055e-06, "loss": 0.0078, "step": 179570 }, { "epoch": 1.94, "learning_rate": 8.79548550301615e-06, "loss": 0.007, "step": 179580 }, { "epoch": 1.94, "learning_rate": 8.779269637413244e-06, "loss": 0.0072, "step": 179590 }, { "epoch": 1.94, "learning_rate": 8.763053771810339e-06, "loss": 0.0061, "step": 179600 }, { "epoch": 1.94, "learning_rate": 8.746837906207433e-06, "loss": 0.0044, "step": 179610 }, { "epoch": 1.94, "learning_rate": 8.730622040604528e-06, "loss": 0.0065, "step": 179620 }, { "epoch": 1.94, "learning_rate": 8.71440617500162e-06, "loss": 0.0042, "step": 179630 }, { "epoch": 1.94, "learning_rate": 8.698190309398715e-06, "loss": 0.0079, "step": 179640 }, { "epoch": 1.94, "learning_rate": 8.68197444379581e-06, "loss": 0.005, "step": 179650 }, { "epoch": 1.94, "learning_rate": 8.665758578192904e-06, "loss": 0.0086, "step": 179660 }, { "epoch": 1.94, "learning_rate": 8.649542712589996e-06, "loss": 0.005, "step": 179670 }, { "epoch": 1.94, "learning_rate": 8.633326846987091e-06, "loss": 0.006, "step": 179680 }, { "epoch": 1.94, "learning_rate": 8.617110981384185e-06, "loss": 0.0063, "step": 179690 }, { "epoch": 1.94, "learning_rate": 8.60089511578128e-06, "loss": 0.006, "step": 179700 }, { "epoch": 1.94, "learning_rate": 8.584679250178374e-06, "loss": 0.0059, "step": 179710 }, { "epoch": 1.94, "learning_rate": 8.568463384575469e-06, "loss": 0.006, "step": 179720 }, { "epoch": 1.94, "learning_rate": 8.552247518972561e-06, "loss": 0.0062, "step": 179730 }, { "epoch": 1.94, "learning_rate": 8.536031653369656e-06, "loss": 0.0063, "step": 179740 }, { "epoch": 1.94, "learning_rate": 8.51981578776675e-06, "loss": 0.0062, "step": 179750 }, { "epoch": 1.94, "learning_rate": 8.503599922163845e-06, "loss": 0.0055, "step": 179760 }, { "epoch": 1.94, "learning_rate": 8.487384056560937e-06, "loss": 0.0075, "step": 179770 }, { "epoch": 1.94, "learning_rate": 8.471168190958032e-06, "loss": 0.0051, "step": 179780 }, { "epoch": 1.94, "learning_rate": 8.454952325355126e-06, "loss": 0.0064, "step": 179790 }, { "epoch": 1.94, "learning_rate": 8.43873645975222e-06, "loss": 0.0065, "step": 179800 }, { "epoch": 1.94, "learning_rate": 8.422520594149315e-06, "loss": 0.0073, "step": 179810 }, { "epoch": 1.94, "learning_rate": 8.40630472854641e-06, "loss": 0.0064, "step": 179820 }, { "epoch": 1.94, "learning_rate": 8.390088862943502e-06, "loss": 0.0066, "step": 179830 }, { "epoch": 1.94, "learning_rate": 8.373872997340597e-06, "loss": 0.0069, "step": 179840 }, { "epoch": 1.94, "learning_rate": 8.357657131737691e-06, "loss": 0.0067, "step": 179850 }, { "epoch": 1.94, "learning_rate": 8.341441266134786e-06, "loss": 0.0046, "step": 179860 }, { "epoch": 1.94, "learning_rate": 8.32522540053188e-06, "loss": 0.0071, "step": 179870 }, { "epoch": 1.94, "learning_rate": 8.309009534928975e-06, "loss": 0.0073, "step": 179880 }, { "epoch": 1.94, "learning_rate": 8.292793669326069e-06, "loss": 0.0046, "step": 179890 }, { "epoch": 1.94, "learning_rate": 8.276577803723162e-06, "loss": 0.0061, "step": 179900 }, { "epoch": 1.94, "learning_rate": 8.260361938120256e-06, "loss": 0.0065, "step": 179910 }, { "epoch": 1.95, "learning_rate": 8.24414607251735e-06, "loss": 0.0068, "step": 179920 }, { "epoch": 1.95, "learning_rate": 8.227930206914445e-06, "loss": 0.0046, "step": 179930 }, { "epoch": 1.95, "learning_rate": 8.211714341311538e-06, "loss": 0.0059, "step": 179940 }, { "epoch": 1.95, "learning_rate": 8.195498475708632e-06, "loss": 0.0051, "step": 179950 }, { "epoch": 1.95, "learning_rate": 8.179282610105727e-06, "loss": 0.0061, "step": 179960 }, { "epoch": 1.95, "learning_rate": 8.163066744502821e-06, "loss": 0.0057, "step": 179970 }, { "epoch": 1.95, "learning_rate": 8.146850878899916e-06, "loss": 0.0101, "step": 179980 }, { "epoch": 1.95, "learning_rate": 8.13063501329701e-06, "loss": 0.0077, "step": 179990 }, { "epoch": 1.95, "learning_rate": 8.114419147694103e-06, "loss": 0.0059, "step": 180000 }, { "epoch": 1.95, "eval_cer": 0.9215034822292522, "eval_loss": 0.005232350900769234, "eval_runtime": 121.4858, "eval_samples_per_second": 16.463, "eval_steps_per_second": 4.116, "step": 180000 }, { "epoch": 1.95, "learning_rate": 8.098203282091197e-06, "loss": 0.0068, "step": 180010 }, { "epoch": 1.95, "learning_rate": 8.081987416488292e-06, "loss": 0.0064, "step": 180020 }, { "epoch": 1.95, "learning_rate": 8.065771550885386e-06, "loss": 0.0055, "step": 180030 }, { "epoch": 1.95, "learning_rate": 8.049555685282479e-06, "loss": 0.0043, "step": 180040 }, { "epoch": 1.95, "learning_rate": 8.033339819679575e-06, "loss": 0.0072, "step": 180050 }, { "epoch": 1.95, "learning_rate": 8.017123954076668e-06, "loss": 0.007, "step": 180060 }, { "epoch": 1.95, "learning_rate": 8.000908088473762e-06, "loss": 0.0051, "step": 180070 }, { "epoch": 1.95, "learning_rate": 7.984692222870857e-06, "loss": 0.0067, "step": 180080 }, { "epoch": 1.95, "learning_rate": 7.968476357267951e-06, "loss": 0.0065, "step": 180090 }, { "epoch": 1.95, "learning_rate": 7.952260491665044e-06, "loss": 0.0061, "step": 180100 }, { "epoch": 1.95, "learning_rate": 7.936044626062138e-06, "loss": 0.0049, "step": 180110 }, { "epoch": 1.95, "learning_rate": 7.919828760459233e-06, "loss": 0.0055, "step": 180120 }, { "epoch": 1.95, "learning_rate": 7.903612894856327e-06, "loss": 0.0064, "step": 180130 }, { "epoch": 1.95, "learning_rate": 7.887397029253421e-06, "loss": 0.0056, "step": 180140 }, { "epoch": 1.95, "learning_rate": 7.871181163650516e-06, "loss": 0.0092, "step": 180150 }, { "epoch": 1.95, "learning_rate": 7.854965298047609e-06, "loss": 0.0049, "step": 180160 }, { "epoch": 1.95, "learning_rate": 7.838749432444703e-06, "loss": 0.0065, "step": 180170 }, { "epoch": 1.95, "learning_rate": 7.822533566841798e-06, "loss": 0.0092, "step": 180180 }, { "epoch": 1.95, "learning_rate": 7.806317701238892e-06, "loss": 0.005, "step": 180190 }, { "epoch": 1.95, "learning_rate": 7.790101835635985e-06, "loss": 0.0077, "step": 180200 }, { "epoch": 1.95, "learning_rate": 7.773885970033079e-06, "loss": 0.0064, "step": 180210 }, { "epoch": 1.95, "learning_rate": 7.757670104430174e-06, "loss": 0.0057, "step": 180220 }, { "epoch": 1.95, "learning_rate": 7.741454238827268e-06, "loss": 0.0056, "step": 180230 }, { "epoch": 1.95, "learning_rate": 7.725238373224362e-06, "loss": 0.004, "step": 180240 }, { "epoch": 1.95, "learning_rate": 7.709022507621457e-06, "loss": 0.0053, "step": 180250 }, { "epoch": 1.95, "learning_rate": 7.69280664201855e-06, "loss": 0.0066, "step": 180260 }, { "epoch": 1.95, "learning_rate": 7.676590776415644e-06, "loss": 0.005, "step": 180270 }, { "epoch": 1.95, "learning_rate": 7.660374910812738e-06, "loss": 0.0069, "step": 180280 }, { "epoch": 1.95, "learning_rate": 7.644159045209833e-06, "loss": 0.0049, "step": 180290 }, { "epoch": 1.95, "learning_rate": 7.6279431796069265e-06, "loss": 0.0046, "step": 180300 }, { "epoch": 1.95, "learning_rate": 7.61172731400402e-06, "loss": 0.0071, "step": 180310 }, { "epoch": 1.95, "learning_rate": 7.595511448401115e-06, "loss": 0.0047, "step": 180320 }, { "epoch": 1.95, "learning_rate": 7.57929558279821e-06, "loss": 0.0064, "step": 180330 }, { "epoch": 1.95, "learning_rate": 7.563079717195303e-06, "loss": 0.0077, "step": 180340 }, { "epoch": 1.95, "learning_rate": 7.546863851592398e-06, "loss": 0.0051, "step": 180350 }, { "epoch": 1.95, "learning_rate": 7.5306479859894914e-06, "loss": 0.0044, "step": 180360 }, { "epoch": 1.95, "learning_rate": 7.514432120386586e-06, "loss": 0.0073, "step": 180370 }, { "epoch": 1.95, "learning_rate": 7.4982162547836795e-06, "loss": 0.0074, "step": 180380 }, { "epoch": 1.95, "learning_rate": 7.482000389180774e-06, "loss": 0.0094, "step": 180390 }, { "epoch": 1.95, "learning_rate": 7.4657845235778675e-06, "loss": 0.0053, "step": 180400 }, { "epoch": 1.95, "learning_rate": 7.449568657974963e-06, "loss": 0.0053, "step": 180410 }, { "epoch": 1.95, "learning_rate": 7.433352792372056e-06, "loss": 0.0066, "step": 180420 }, { "epoch": 1.95, "learning_rate": 7.417136926769151e-06, "loss": 0.0068, "step": 180430 }, { "epoch": 1.95, "learning_rate": 7.400921061166244e-06, "loss": 0.0075, "step": 180440 }, { "epoch": 1.95, "learning_rate": 7.384705195563339e-06, "loss": 0.0055, "step": 180450 }, { "epoch": 1.95, "learning_rate": 7.3684893299604324e-06, "loss": 0.0041, "step": 180460 }, { "epoch": 1.95, "learning_rate": 7.352273464357527e-06, "loss": 0.0055, "step": 180470 }, { "epoch": 1.95, "learning_rate": 7.3360575987546205e-06, "loss": 0.0047, "step": 180480 }, { "epoch": 1.95, "learning_rate": 7.319841733151715e-06, "loss": 0.0046, "step": 180490 }, { "epoch": 1.95, "learning_rate": 7.303625867548809e-06, "loss": 0.0096, "step": 180500 }, { "epoch": 1.95, "learning_rate": 7.287410001945904e-06, "loss": 0.0063, "step": 180510 }, { "epoch": 1.95, "learning_rate": 7.271194136342997e-06, "loss": 0.0042, "step": 180520 }, { "epoch": 1.95, "learning_rate": 7.254978270740092e-06, "loss": 0.0054, "step": 180530 }, { "epoch": 1.95, "learning_rate": 7.238762405137185e-06, "loss": 0.0065, "step": 180540 }, { "epoch": 1.95, "learning_rate": 7.22254653953428e-06, "loss": 0.0054, "step": 180550 }, { "epoch": 1.95, "learning_rate": 7.206330673931373e-06, "loss": 0.0071, "step": 180560 }, { "epoch": 1.95, "learning_rate": 7.190114808328468e-06, "loss": 0.0093, "step": 180570 }, { "epoch": 1.95, "learning_rate": 7.1738989427255615e-06, "loss": 0.0063, "step": 180580 }, { "epoch": 1.95, "learning_rate": 7.157683077122657e-06, "loss": 0.008, "step": 180590 }, { "epoch": 1.95, "learning_rate": 7.14146721151975e-06, "loss": 0.006, "step": 180600 }, { "epoch": 1.95, "learning_rate": 7.125251345916845e-06, "loss": 0.0061, "step": 180610 }, { "epoch": 1.95, "learning_rate": 7.109035480313938e-06, "loss": 0.006, "step": 180620 }, { "epoch": 1.95, "learning_rate": 7.092819614711033e-06, "loss": 0.0063, "step": 180630 }, { "epoch": 1.95, "learning_rate": 7.076603749108126e-06, "loss": 0.0068, "step": 180640 }, { "epoch": 1.95, "learning_rate": 7.060387883505221e-06, "loss": 0.0068, "step": 180650 }, { "epoch": 1.95, "learning_rate": 7.044172017902314e-06, "loss": 0.0059, "step": 180660 }, { "epoch": 1.95, "learning_rate": 7.027956152299409e-06, "loss": 0.0053, "step": 180670 }, { "epoch": 1.95, "learning_rate": 7.011740286696504e-06, "loss": 0.0051, "step": 180680 }, { "epoch": 1.95, "learning_rate": 6.995524421093598e-06, "loss": 0.0074, "step": 180690 }, { "epoch": 1.95, "learning_rate": 6.979308555490692e-06, "loss": 0.0062, "step": 180700 }, { "epoch": 1.95, "learning_rate": 6.963092689887786e-06, "loss": 0.0072, "step": 180710 }, { "epoch": 1.95, "learning_rate": 6.94687682428488e-06, "loss": 0.005, "step": 180720 }, { "epoch": 1.95, "learning_rate": 6.930660958681974e-06, "loss": 0.0067, "step": 180730 }, { "epoch": 1.95, "learning_rate": 6.914445093079067e-06, "loss": 0.0057, "step": 180740 }, { "epoch": 1.95, "learning_rate": 6.898229227476162e-06, "loss": 0.0066, "step": 180750 }, { "epoch": 1.95, "learning_rate": 6.882013361873255e-06, "loss": 0.0061, "step": 180760 }, { "epoch": 1.95, "learning_rate": 6.865797496270351e-06, "loss": 0.0058, "step": 180770 }, { "epoch": 1.95, "learning_rate": 6.849581630667445e-06, "loss": 0.006, "step": 180780 }, { "epoch": 1.95, "learning_rate": 6.833365765064539e-06, "loss": 0.0049, "step": 180790 }, { "epoch": 1.95, "learning_rate": 6.817149899461633e-06, "loss": 0.0051, "step": 180800 }, { "epoch": 1.95, "learning_rate": 6.800934033858727e-06, "loss": 0.0071, "step": 180810 }, { "epoch": 1.95, "learning_rate": 6.784718168255821e-06, "loss": 0.0075, "step": 180820 }, { "epoch": 1.95, "learning_rate": 6.768502302652915e-06, "loss": 0.0074, "step": 180830 }, { "epoch": 1.95, "learning_rate": 6.752286437050009e-06, "loss": 0.0061, "step": 180840 }, { "epoch": 1.96, "learning_rate": 6.736070571447103e-06, "loss": 0.0068, "step": 180850 }, { "epoch": 1.96, "learning_rate": 6.719854705844198e-06, "loss": 0.0057, "step": 180860 }, { "epoch": 1.96, "learning_rate": 6.703638840241292e-06, "loss": 0.0062, "step": 180870 }, { "epoch": 1.96, "learning_rate": 6.687422974638386e-06, "loss": 0.0042, "step": 180880 }, { "epoch": 1.96, "learning_rate": 6.67120710903548e-06, "loss": 0.0051, "step": 180890 }, { "epoch": 1.96, "learning_rate": 6.654991243432574e-06, "loss": 0.0065, "step": 180900 }, { "epoch": 1.96, "learning_rate": 6.638775377829668e-06, "loss": 0.0063, "step": 180910 }, { "epoch": 1.96, "learning_rate": 6.622559512226762e-06, "loss": 0.0064, "step": 180920 }, { "epoch": 1.96, "learning_rate": 6.606343646623856e-06, "loss": 0.0052, "step": 180930 }, { "epoch": 1.96, "learning_rate": 6.59012778102095e-06, "loss": 0.0054, "step": 180940 }, { "epoch": 1.96, "learning_rate": 6.573911915418045e-06, "loss": 0.0101, "step": 180950 }, { "epoch": 1.96, "learning_rate": 6.557696049815139e-06, "loss": 0.0064, "step": 180960 }, { "epoch": 1.96, "learning_rate": 6.541480184212233e-06, "loss": 0.005, "step": 180970 }, { "epoch": 1.96, "learning_rate": 6.525264318609327e-06, "loss": 0.0043, "step": 180980 }, { "epoch": 1.96, "learning_rate": 6.509048453006421e-06, "loss": 0.0058, "step": 180990 }, { "epoch": 1.96, "learning_rate": 6.492832587403515e-06, "loss": 0.0053, "step": 181000 }, { "epoch": 1.96, "eval_cer": 0.921500876420383, "eval_loss": 0.005276523530483246, "eval_runtime": 121.2902, "eval_samples_per_second": 16.489, "eval_steps_per_second": 4.122, "step": 181000 }, { "epoch": 1.96, "learning_rate": 6.476616721800609e-06, "loss": 0.0058, "step": 181010 }, { "epoch": 1.96, "learning_rate": 6.460400856197703e-06, "loss": 0.0084, "step": 181020 }, { "epoch": 1.96, "learning_rate": 6.444184990594797e-06, "loss": 0.0088, "step": 181030 }, { "epoch": 1.96, "learning_rate": 6.427969124991892e-06, "loss": 0.0085, "step": 181040 }, { "epoch": 1.96, "learning_rate": 6.411753259388986e-06, "loss": 0.0054, "step": 181050 }, { "epoch": 1.96, "learning_rate": 6.39553739378608e-06, "loss": 0.0054, "step": 181060 }, { "epoch": 1.96, "learning_rate": 6.379321528183174e-06, "loss": 0.0084, "step": 181070 }, { "epoch": 1.96, "learning_rate": 6.363105662580268e-06, "loss": 0.0073, "step": 181080 }, { "epoch": 1.96, "learning_rate": 6.346889796977362e-06, "loss": 0.0047, "step": 181090 }, { "epoch": 1.96, "learning_rate": 6.330673931374456e-06, "loss": 0.0077, "step": 181100 }, { "epoch": 1.96, "learning_rate": 6.31445806577155e-06, "loss": 0.0062, "step": 181110 }, { "epoch": 1.96, "learning_rate": 6.298242200168644e-06, "loss": 0.0064, "step": 181120 }, { "epoch": 1.96, "learning_rate": 6.282026334565739e-06, "loss": 0.0053, "step": 181130 }, { "epoch": 1.96, "learning_rate": 6.265810468962833e-06, "loss": 0.0069, "step": 181140 }, { "epoch": 1.96, "learning_rate": 6.2495946033599274e-06, "loss": 0.006, "step": 181150 }, { "epoch": 1.96, "learning_rate": 6.233378737757021e-06, "loss": 0.0062, "step": 181160 }, { "epoch": 1.96, "learning_rate": 6.2171628721541155e-06, "loss": 0.0052, "step": 181170 }, { "epoch": 1.96, "learning_rate": 6.200947006551209e-06, "loss": 0.0048, "step": 181180 }, { "epoch": 1.96, "learning_rate": 6.1847311409483035e-06, "loss": 0.0082, "step": 181190 }, { "epoch": 1.96, "learning_rate": 6.168515275345397e-06, "loss": 0.0044, "step": 181200 }, { "epoch": 1.96, "learning_rate": 6.152299409742491e-06, "loss": 0.0051, "step": 181210 }, { "epoch": 1.96, "learning_rate": 6.136083544139586e-06, "loss": 0.0053, "step": 181220 }, { "epoch": 1.96, "learning_rate": 6.11986767853668e-06, "loss": 0.0073, "step": 181230 }, { "epoch": 1.96, "learning_rate": 6.103651812933774e-06, "loss": 0.006, "step": 181240 }, { "epoch": 1.96, "learning_rate": 6.0874359473308684e-06, "loss": 0.0071, "step": 181250 }, { "epoch": 1.96, "learning_rate": 6.071220081727962e-06, "loss": 0.0062, "step": 181260 }, { "epoch": 1.96, "learning_rate": 6.0550042161250565e-06, "loss": 0.0059, "step": 181270 }, { "epoch": 1.96, "learning_rate": 6.03878835052215e-06, "loss": 0.0079, "step": 181280 }, { "epoch": 1.96, "learning_rate": 6.0225724849192445e-06, "loss": 0.0057, "step": 181290 }, { "epoch": 1.96, "learning_rate": 6.006356619316338e-06, "loss": 0.0077, "step": 181300 }, { "epoch": 1.96, "learning_rate": 5.990140753713433e-06, "loss": 0.0067, "step": 181310 }, { "epoch": 1.96, "learning_rate": 5.973924888110527e-06, "loss": 0.0069, "step": 181320 }, { "epoch": 1.96, "learning_rate": 5.957709022507621e-06, "loss": 0.006, "step": 181330 }, { "epoch": 1.96, "learning_rate": 5.941493156904715e-06, "loss": 0.0053, "step": 181340 }, { "epoch": 1.96, "learning_rate": 5.925277291301809e-06, "loss": 0.0064, "step": 181350 }, { "epoch": 1.96, "learning_rate": 5.909061425698903e-06, "loss": 0.0059, "step": 181360 }, { "epoch": 1.96, "learning_rate": 5.8928455600959975e-06, "loss": 0.0059, "step": 181370 }, { "epoch": 1.96, "learning_rate": 5.876629694493091e-06, "loss": 0.0051, "step": 181380 }, { "epoch": 1.96, "learning_rate": 5.8604138288901855e-06, "loss": 0.0048, "step": 181390 }, { "epoch": 1.96, "learning_rate": 5.84419796328728e-06, "loss": 0.0052, "step": 181400 }, { "epoch": 1.96, "learning_rate": 5.827982097684374e-06, "loss": 0.0042, "step": 181410 }, { "epoch": 1.96, "learning_rate": 5.811766232081468e-06, "loss": 0.0077, "step": 181420 }, { "epoch": 1.96, "learning_rate": 5.795550366478562e-06, "loss": 0.0064, "step": 181430 }, { "epoch": 1.96, "learning_rate": 5.779334500875656e-06, "loss": 0.0064, "step": 181440 }, { "epoch": 1.96, "learning_rate": 5.76311863527275e-06, "loss": 0.006, "step": 181450 }, { "epoch": 1.96, "learning_rate": 5.746902769669844e-06, "loss": 0.0048, "step": 181460 }, { "epoch": 1.96, "learning_rate": 5.7306869040669384e-06, "loss": 0.0061, "step": 181470 }, { "epoch": 1.96, "learning_rate": 5.714471038464032e-06, "loss": 0.0076, "step": 181480 }, { "epoch": 1.96, "learning_rate": 5.698255172861127e-06, "loss": 0.0037, "step": 181490 }, { "epoch": 1.96, "learning_rate": 5.682039307258222e-06, "loss": 0.005, "step": 181500 }, { "epoch": 1.96, "learning_rate": 5.665823441655315e-06, "loss": 0.008, "step": 181510 }, { "epoch": 1.96, "learning_rate": 5.649607576052409e-06, "loss": 0.0071, "step": 181520 }, { "epoch": 1.96, "learning_rate": 5.633391710449503e-06, "loss": 0.007, "step": 181530 }, { "epoch": 1.96, "learning_rate": 5.617175844846597e-06, "loss": 0.0063, "step": 181540 }, { "epoch": 1.96, "learning_rate": 5.600959979243691e-06, "loss": 0.0046, "step": 181550 }, { "epoch": 1.96, "learning_rate": 5.584744113640785e-06, "loss": 0.0068, "step": 181560 }, { "epoch": 1.96, "learning_rate": 5.5685282480378794e-06, "loss": 0.0054, "step": 181570 }, { "epoch": 1.96, "learning_rate": 5.552312382434975e-06, "loss": 0.0085, "step": 181580 }, { "epoch": 1.96, "learning_rate": 5.536096516832068e-06, "loss": 0.0052, "step": 181590 }, { "epoch": 1.96, "learning_rate": 5.519880651229163e-06, "loss": 0.005, "step": 181600 }, { "epoch": 1.96, "learning_rate": 5.503664785626256e-06, "loss": 0.0067, "step": 181610 }, { "epoch": 1.96, "learning_rate": 5.487448920023351e-06, "loss": 0.006, "step": 181620 }, { "epoch": 1.96, "learning_rate": 5.471233054420444e-06, "loss": 0.0052, "step": 181630 }, { "epoch": 1.96, "learning_rate": 5.455017188817539e-06, "loss": 0.0074, "step": 181640 }, { "epoch": 1.96, "learning_rate": 5.438801323214632e-06, "loss": 0.0064, "step": 181650 }, { "epoch": 1.96, "learning_rate": 5.422585457611727e-06, "loss": 0.0057, "step": 181660 }, { "epoch": 1.96, "learning_rate": 5.406369592008821e-06, "loss": 0.006, "step": 181670 }, { "epoch": 1.96, "learning_rate": 5.390153726405916e-06, "loss": 0.005, "step": 181680 }, { "epoch": 1.96, "learning_rate": 5.373937860803009e-06, "loss": 0.0049, "step": 181690 }, { "epoch": 1.96, "learning_rate": 5.357721995200104e-06, "loss": 0.0046, "step": 181700 }, { "epoch": 1.96, "learning_rate": 5.341506129597197e-06, "loss": 0.0067, "step": 181710 }, { "epoch": 1.96, "learning_rate": 5.325290263994292e-06, "loss": 0.0044, "step": 181720 }, { "epoch": 1.96, "learning_rate": 5.309074398391385e-06, "loss": 0.0059, "step": 181730 }, { "epoch": 1.96, "learning_rate": 5.29285853278848e-06, "loss": 0.006, "step": 181740 }, { "epoch": 1.96, "learning_rate": 5.276642667185573e-06, "loss": 0.0093, "step": 181750 }, { "epoch": 1.96, "learning_rate": 5.260426801582669e-06, "loss": 0.0063, "step": 181760 }, { "epoch": 1.97, "learning_rate": 5.244210935979762e-06, "loss": 0.0066, "step": 181770 }, { "epoch": 1.97, "learning_rate": 5.227995070376857e-06, "loss": 0.005, "step": 181780 }, { "epoch": 1.97, "learning_rate": 5.21177920477395e-06, "loss": 0.0048, "step": 181790 }, { "epoch": 1.97, "learning_rate": 5.195563339171045e-06, "loss": 0.0084, "step": 181800 }, { "epoch": 1.97, "learning_rate": 5.179347473568138e-06, "loss": 0.006, "step": 181810 }, { "epoch": 1.97, "learning_rate": 5.163131607965233e-06, "loss": 0.0066, "step": 181820 }, { "epoch": 1.97, "learning_rate": 5.146915742362326e-06, "loss": 0.0061, "step": 181830 }, { "epoch": 1.97, "learning_rate": 5.130699876759421e-06, "loss": 0.0052, "step": 181840 }, { "epoch": 1.97, "learning_rate": 5.114484011156515e-06, "loss": 0.0051, "step": 181850 }, { "epoch": 1.97, "learning_rate": 5.09826814555361e-06, "loss": 0.0081, "step": 181860 }, { "epoch": 1.97, "learning_rate": 5.082052279950703e-06, "loss": 0.0062, "step": 181870 }, { "epoch": 1.97, "learning_rate": 5.065836414347798e-06, "loss": 0.0062, "step": 181880 }, { "epoch": 1.97, "learning_rate": 5.049620548744891e-06, "loss": 0.0072, "step": 181890 }, { "epoch": 1.97, "learning_rate": 5.033404683141986e-06, "loss": 0.0045, "step": 181900 }, { "epoch": 1.97, "learning_rate": 5.017188817539079e-06, "loss": 0.0087, "step": 181910 }, { "epoch": 1.97, "learning_rate": 5.000972951936174e-06, "loss": 0.0053, "step": 181920 }, { "epoch": 1.97, "learning_rate": 4.984757086333267e-06, "loss": 0.0049, "step": 181930 }, { "epoch": 1.97, "learning_rate": 4.968541220730363e-06, "loss": 0.0054, "step": 181940 }, { "epoch": 1.97, "learning_rate": 4.952325355127457e-06, "loss": 0.004, "step": 181950 }, { "epoch": 1.97, "learning_rate": 4.936109489524551e-06, "loss": 0.0062, "step": 181960 }, { "epoch": 1.97, "learning_rate": 4.919893623921645e-06, "loss": 0.0061, "step": 181970 }, { "epoch": 1.97, "learning_rate": 4.903677758318739e-06, "loss": 0.006, "step": 181980 }, { "epoch": 1.97, "learning_rate": 4.887461892715832e-06, "loss": 0.0044, "step": 181990 }, { "epoch": 1.97, "learning_rate": 4.871246027112927e-06, "loss": 0.0056, "step": 182000 }, { "epoch": 1.97, "eval_cer": 0.9215017450233394, "eval_loss": 0.0052335127256810665, "eval_runtime": 121.2359, "eval_samples_per_second": 16.497, "eval_steps_per_second": 4.124, "step": 182000 }, { "epoch": 1.97, "learning_rate": 4.85503016151002e-06, "loss": 0.0057, "step": 182010 }, { "epoch": 1.97, "learning_rate": 4.838814295907115e-06, "loss": 0.0073, "step": 182020 }, { "epoch": 1.97, "learning_rate": 4.82259843030421e-06, "loss": 0.0076, "step": 182030 }, { "epoch": 1.97, "learning_rate": 4.806382564701304e-06, "loss": 0.0061, "step": 182040 }, { "epoch": 1.97, "learning_rate": 4.790166699098398e-06, "loss": 0.0052, "step": 182050 }, { "epoch": 1.97, "learning_rate": 4.773950833495492e-06, "loss": 0.004, "step": 182060 }, { "epoch": 1.97, "learning_rate": 4.757734967892586e-06, "loss": 0.0063, "step": 182070 }, { "epoch": 1.97, "learning_rate": 4.74151910228968e-06, "loss": 0.0052, "step": 182080 }, { "epoch": 1.97, "learning_rate": 4.725303236686774e-06, "loss": 0.0059, "step": 182090 }, { "epoch": 1.97, "learning_rate": 4.709087371083868e-06, "loss": 0.0073, "step": 182100 }, { "epoch": 1.97, "learning_rate": 4.692871505480962e-06, "loss": 0.0081, "step": 182110 }, { "epoch": 1.97, "learning_rate": 4.6766556398780565e-06, "loss": 0.007, "step": 182120 }, { "epoch": 1.97, "learning_rate": 4.66043977427515e-06, "loss": 0.0053, "step": 182130 }, { "epoch": 1.97, "learning_rate": 4.6442239086722446e-06, "loss": 0.0049, "step": 182140 }, { "epoch": 1.97, "learning_rate": 4.628008043069339e-06, "loss": 0.0059, "step": 182150 }, { "epoch": 1.97, "learning_rate": 4.611792177466433e-06, "loss": 0.0067, "step": 182160 }, { "epoch": 1.97, "learning_rate": 4.595576311863527e-06, "loss": 0.0053, "step": 182170 }, { "epoch": 1.97, "learning_rate": 4.579360446260621e-06, "loss": 0.0083, "step": 182180 }, { "epoch": 1.97, "learning_rate": 4.563144580657715e-06, "loss": 0.0058, "step": 182190 }, { "epoch": 1.97, "learning_rate": 4.5469287150548095e-06, "loss": 0.0048, "step": 182200 }, { "epoch": 1.97, "learning_rate": 4.530712849451903e-06, "loss": 0.005, "step": 182210 }, { "epoch": 1.97, "learning_rate": 4.5144969838489975e-06, "loss": 0.0057, "step": 182220 }, { "epoch": 1.97, "learning_rate": 4.498281118246091e-06, "loss": 0.0057, "step": 182230 }, { "epoch": 1.97, "learning_rate": 4.4820652526431856e-06, "loss": 0.0058, "step": 182240 }, { "epoch": 1.97, "learning_rate": 4.46584938704028e-06, "loss": 0.0055, "step": 182250 }, { "epoch": 1.97, "learning_rate": 4.449633521437374e-06, "loss": 0.0072, "step": 182260 }, { "epoch": 1.97, "learning_rate": 4.433417655834468e-06, "loss": 0.009, "step": 182270 }, { "epoch": 1.97, "learning_rate": 4.4172017902315625e-06, "loss": 0.0057, "step": 182280 }, { "epoch": 1.97, "learning_rate": 4.400985924628656e-06, "loss": 0.0062, "step": 182290 }, { "epoch": 1.97, "learning_rate": 4.3847700590257505e-06, "loss": 0.0047, "step": 182300 }, { "epoch": 1.97, "learning_rate": 4.368554193422844e-06, "loss": 0.0055, "step": 182310 }, { "epoch": 1.97, "learning_rate": 4.3523383278199385e-06, "loss": 0.0066, "step": 182320 }, { "epoch": 1.97, "learning_rate": 4.336122462217033e-06, "loss": 0.0052, "step": 182330 }, { "epoch": 1.97, "learning_rate": 4.3199065966141265e-06, "loss": 0.0118, "step": 182340 }, { "epoch": 1.97, "learning_rate": 4.303690731011221e-06, "loss": 0.0061, "step": 182350 }, { "epoch": 1.97, "learning_rate": 4.287474865408315e-06, "loss": 0.0073, "step": 182360 }, { "epoch": 1.97, "learning_rate": 4.27125899980541e-06, "loss": 0.0062, "step": 182370 }, { "epoch": 1.97, "learning_rate": 4.2550431342025035e-06, "loss": 0.0057, "step": 182380 }, { "epoch": 1.97, "learning_rate": 4.238827268599597e-06, "loss": 0.0054, "step": 182390 }, { "epoch": 1.97, "learning_rate": 4.2226114029966915e-06, "loss": 0.0053, "step": 182400 }, { "epoch": 1.97, "learning_rate": 4.206395537393785e-06, "loss": 0.0077, "step": 182410 }, { "epoch": 1.97, "learning_rate": 4.19017967179088e-06, "loss": 0.0049, "step": 182420 }, { "epoch": 1.97, "learning_rate": 4.173963806187974e-06, "loss": 0.0061, "step": 182430 }, { "epoch": 1.97, "learning_rate": 4.157747940585068e-06, "loss": 0.0053, "step": 182440 }, { "epoch": 1.97, "learning_rate": 4.141532074982162e-06, "loss": 0.0061, "step": 182450 }, { "epoch": 1.97, "learning_rate": 4.125316209379256e-06, "loss": 0.0088, "step": 182460 }, { "epoch": 1.97, "learning_rate": 4.109100343776351e-06, "loss": 0.0065, "step": 182470 }, { "epoch": 1.97, "learning_rate": 4.0928844781734444e-06, "loss": 0.0085, "step": 182480 }, { "epoch": 1.97, "learning_rate": 4.076668612570539e-06, "loss": 0.007, "step": 182490 }, { "epoch": 1.97, "learning_rate": 4.060452746967633e-06, "loss": 0.0092, "step": 182500 }, { "epoch": 1.97, "learning_rate": 4.044236881364727e-06, "loss": 0.0059, "step": 182510 }, { "epoch": 1.97, "learning_rate": 4.028021015761821e-06, "loss": 0.0085, "step": 182520 }, { "epoch": 1.97, "learning_rate": 4.011805150158915e-06, "loss": 0.005, "step": 182530 }, { "epoch": 1.97, "learning_rate": 3.995589284556009e-06, "loss": 0.0054, "step": 182540 }, { "epoch": 1.97, "learning_rate": 3.979373418953104e-06, "loss": 0.0055, "step": 182550 }, { "epoch": 1.97, "learning_rate": 3.963157553350197e-06, "loss": 0.0055, "step": 182560 }, { "epoch": 1.97, "learning_rate": 3.946941687747292e-06, "loss": 0.0039, "step": 182570 }, { "epoch": 1.97, "learning_rate": 3.9307258221443854e-06, "loss": 0.0072, "step": 182580 }, { "epoch": 1.97, "learning_rate": 3.91450995654148e-06, "loss": 0.0052, "step": 182590 }, { "epoch": 1.97, "learning_rate": 3.898294090938574e-06, "loss": 0.0073, "step": 182600 }, { "epoch": 1.97, "learning_rate": 3.882078225335668e-06, "loss": 0.0083, "step": 182610 }, { "epoch": 1.97, "learning_rate": 3.865862359732762e-06, "loss": 0.0099, "step": 182620 }, { "epoch": 1.97, "learning_rate": 3.849646494129856e-06, "loss": 0.0066, "step": 182630 }, { "epoch": 1.97, "learning_rate": 3.83343062852695e-06, "loss": 0.0075, "step": 182640 }, { "epoch": 1.97, "learning_rate": 3.817214762924045e-06, "loss": 0.006, "step": 182650 }, { "epoch": 1.97, "learning_rate": 3.800998897321139e-06, "loss": 0.0056, "step": 182660 }, { "epoch": 1.97, "learning_rate": 3.784783031718233e-06, "loss": 0.0054, "step": 182670 }, { "epoch": 1.97, "learning_rate": 3.7685671661153273e-06, "loss": 0.0054, "step": 182680 }, { "epoch": 1.97, "learning_rate": 3.7523513005124213e-06, "loss": 0.0053, "step": 182690 }, { "epoch": 1.98, "learning_rate": 3.7361354349095153e-06, "loss": 0.0054, "step": 182700 }, { "epoch": 1.98, "learning_rate": 3.7199195693066093e-06, "loss": 0.0055, "step": 182710 }, { "epoch": 1.98, "learning_rate": 3.7037037037037033e-06, "loss": 0.0051, "step": 182720 }, { "epoch": 1.98, "learning_rate": 3.6874878381007978e-06, "loss": 0.0049, "step": 182730 }, { "epoch": 1.98, "learning_rate": 3.6712719724978918e-06, "loss": 0.0118, "step": 182740 }, { "epoch": 1.98, "learning_rate": 3.6550561068949858e-06, "loss": 0.0058, "step": 182750 }, { "epoch": 1.98, "learning_rate": 3.63884024129208e-06, "loss": 0.007, "step": 182760 }, { "epoch": 1.98, "learning_rate": 3.6226243756891742e-06, "loss": 0.0053, "step": 182770 }, { "epoch": 1.98, "learning_rate": 3.6064085100862682e-06, "loss": 0.0054, "step": 182780 }, { "epoch": 1.98, "learning_rate": 3.5901926444833623e-06, "loss": 0.0063, "step": 182790 }, { "epoch": 1.98, "learning_rate": 3.5739767788804563e-06, "loss": 0.0049, "step": 182800 }, { "epoch": 1.98, "learning_rate": 3.5577609132775503e-06, "loss": 0.0051, "step": 182810 }, { "epoch": 1.98, "learning_rate": 3.5415450476746447e-06, "loss": 0.007, "step": 182820 }, { "epoch": 1.98, "learning_rate": 3.5253291820717387e-06, "loss": 0.0083, "step": 182830 }, { "epoch": 1.98, "learning_rate": 3.5091133164688328e-06, "loss": 0.0044, "step": 182840 }, { "epoch": 1.98, "learning_rate": 3.4928974508659268e-06, "loss": 0.0063, "step": 182850 }, { "epoch": 1.98, "learning_rate": 3.476681585263021e-06, "loss": 0.0061, "step": 182860 }, { "epoch": 1.98, "learning_rate": 3.4604657196601152e-06, "loss": 0.0076, "step": 182870 }, { "epoch": 1.98, "learning_rate": 3.4442498540572092e-06, "loss": 0.0063, "step": 182880 }, { "epoch": 1.98, "learning_rate": 3.4280339884543032e-06, "loss": 0.0054, "step": 182890 }, { "epoch": 1.98, "learning_rate": 3.4118181228513973e-06, "loss": 0.0054, "step": 182900 }, { "epoch": 1.98, "learning_rate": 3.3956022572484917e-06, "loss": 0.0076, "step": 182910 }, { "epoch": 1.98, "learning_rate": 3.3793863916455857e-06, "loss": 0.0054, "step": 182920 }, { "epoch": 1.98, "learning_rate": 3.3631705260426797e-06, "loss": 0.0046, "step": 182930 }, { "epoch": 1.98, "learning_rate": 3.3469546604397737e-06, "loss": 0.0063, "step": 182940 }, { "epoch": 1.98, "learning_rate": 3.330738794836868e-06, "loss": 0.007, "step": 182950 }, { "epoch": 1.98, "learning_rate": 3.314522929233962e-06, "loss": 0.0073, "step": 182960 }, { "epoch": 1.98, "learning_rate": 3.298307063631056e-06, "loss": 0.0068, "step": 182970 }, { "epoch": 1.98, "learning_rate": 3.2820911980281502e-06, "loss": 0.0048, "step": 182980 }, { "epoch": 1.98, "learning_rate": 3.2658753324252442e-06, "loss": 0.0063, "step": 182990 }, { "epoch": 1.98, "learning_rate": 3.249659466822339e-06, "loss": 0.0054, "step": 183000 }, { "epoch": 1.98, "eval_cer": 0.9215000078174266, "eval_loss": 0.005184313748031855, "eval_runtime": 121.1588, "eval_samples_per_second": 16.507, "eval_steps_per_second": 4.127, "step": 183000 }, { "epoch": 1.98, "learning_rate": 3.2334436012194327e-06, "loss": 0.0077, "step": 183010 }, { "epoch": 1.98, "learning_rate": 3.2172277356165267e-06, "loss": 0.0052, "step": 183020 }, { "epoch": 1.98, "learning_rate": 3.2010118700136207e-06, "loss": 0.0052, "step": 183030 }, { "epoch": 1.98, "learning_rate": 3.1847960044107156e-06, "loss": 0.0044, "step": 183040 }, { "epoch": 1.98, "learning_rate": 3.1685801388078096e-06, "loss": 0.0057, "step": 183050 }, { "epoch": 1.98, "learning_rate": 3.1523642732049036e-06, "loss": 0.0059, "step": 183060 }, { "epoch": 1.98, "learning_rate": 3.1361484076019976e-06, "loss": 0.0054, "step": 183070 }, { "epoch": 1.98, "learning_rate": 3.1199325419990916e-06, "loss": 0.0061, "step": 183080 }, { "epoch": 1.98, "learning_rate": 3.103716676396186e-06, "loss": 0.0059, "step": 183090 }, { "epoch": 1.98, "learning_rate": 3.08750081079328e-06, "loss": 0.0053, "step": 183100 }, { "epoch": 1.98, "learning_rate": 3.071284945190374e-06, "loss": 0.0067, "step": 183110 }, { "epoch": 1.98, "learning_rate": 3.055069079587468e-06, "loss": 0.0051, "step": 183120 }, { "epoch": 1.98, "learning_rate": 3.0388532139845625e-06, "loss": 0.0066, "step": 183130 }, { "epoch": 1.98, "learning_rate": 3.0226373483816566e-06, "loss": 0.0069, "step": 183140 }, { "epoch": 1.98, "learning_rate": 3.0064214827787506e-06, "loss": 0.0062, "step": 183150 }, { "epoch": 1.98, "learning_rate": 2.9902056171758446e-06, "loss": 0.0056, "step": 183160 }, { "epoch": 1.98, "learning_rate": 2.9739897515729386e-06, "loss": 0.0054, "step": 183170 }, { "epoch": 1.98, "learning_rate": 2.957773885970033e-06, "loss": 0.0069, "step": 183180 }, { "epoch": 1.98, "learning_rate": 2.941558020367127e-06, "loss": 0.0042, "step": 183190 }, { "epoch": 1.98, "learning_rate": 2.925342154764221e-06, "loss": 0.0075, "step": 183200 }, { "epoch": 1.98, "learning_rate": 2.909126289161315e-06, "loss": 0.0072, "step": 183210 }, { "epoch": 1.98, "learning_rate": 2.8929104235584095e-06, "loss": 0.005, "step": 183220 }, { "epoch": 1.98, "learning_rate": 2.8766945579555035e-06, "loss": 0.0061, "step": 183230 }, { "epoch": 1.98, "learning_rate": 2.8604786923525976e-06, "loss": 0.0053, "step": 183240 }, { "epoch": 1.98, "learning_rate": 2.8442628267496916e-06, "loss": 0.007, "step": 183250 }, { "epoch": 1.98, "learning_rate": 2.8280469611467856e-06, "loss": 0.0078, "step": 183260 }, { "epoch": 1.98, "learning_rate": 2.81183109554388e-06, "loss": 0.0049, "step": 183270 }, { "epoch": 1.98, "learning_rate": 2.795615229940974e-06, "loss": 0.0118, "step": 183280 }, { "epoch": 1.98, "learning_rate": 2.779399364338068e-06, "loss": 0.0049, "step": 183290 }, { "epoch": 1.98, "learning_rate": 2.763183498735162e-06, "loss": 0.0073, "step": 183300 }, { "epoch": 1.98, "learning_rate": 2.7469676331322565e-06, "loss": 0.0066, "step": 183310 }, { "epoch": 1.98, "learning_rate": 2.7307517675293505e-06, "loss": 0.0075, "step": 183320 }, { "epoch": 1.98, "learning_rate": 2.7145359019264445e-06, "loss": 0.006, "step": 183330 }, { "epoch": 1.98, "learning_rate": 2.6983200363235385e-06, "loss": 0.0057, "step": 183340 }, { "epoch": 1.98, "learning_rate": 2.6821041707206326e-06, "loss": 0.0053, "step": 183350 }, { "epoch": 1.98, "learning_rate": 2.665888305117727e-06, "loss": 0.0074, "step": 183360 }, { "epoch": 1.98, "learning_rate": 2.649672439514821e-06, "loss": 0.0069, "step": 183370 }, { "epoch": 1.98, "learning_rate": 2.633456573911915e-06, "loss": 0.0083, "step": 183380 }, { "epoch": 1.98, "learning_rate": 2.617240708309009e-06, "loss": 0.0059, "step": 183390 }, { "epoch": 1.98, "learning_rate": 2.6010248427061035e-06, "loss": 0.0061, "step": 183400 }, { "epoch": 1.98, "learning_rate": 2.5848089771031975e-06, "loss": 0.0079, "step": 183410 }, { "epoch": 1.98, "learning_rate": 2.5685931115002915e-06, "loss": 0.0049, "step": 183420 }, { "epoch": 1.98, "learning_rate": 2.5523772458973855e-06, "loss": 0.0054, "step": 183430 }, { "epoch": 1.98, "learning_rate": 2.5361613802944795e-06, "loss": 0.0049, "step": 183440 }, { "epoch": 1.98, "learning_rate": 2.5199455146915744e-06, "loss": 0.0067, "step": 183450 }, { "epoch": 1.98, "learning_rate": 2.5037296490886684e-06, "loss": 0.0045, "step": 183460 }, { "epoch": 1.98, "learning_rate": 2.4875137834857624e-06, "loss": 0.0061, "step": 183470 }, { "epoch": 1.98, "learning_rate": 2.471297917882856e-06, "loss": 0.0062, "step": 183480 }, { "epoch": 1.98, "learning_rate": 2.455082052279951e-06, "loss": 0.0056, "step": 183490 }, { "epoch": 1.98, "learning_rate": 2.438866186677045e-06, "loss": 0.0062, "step": 183500 }, { "epoch": 1.98, "learning_rate": 2.422650321074139e-06, "loss": 0.0045, "step": 183510 }, { "epoch": 1.98, "learning_rate": 2.406434455471233e-06, "loss": 0.0057, "step": 183520 }, { "epoch": 1.98, "learning_rate": 2.390218589868327e-06, "loss": 0.0065, "step": 183530 }, { "epoch": 1.98, "learning_rate": 2.3740027242654214e-06, "loss": 0.0086, "step": 183540 }, { "epoch": 1.98, "learning_rate": 2.3577868586625154e-06, "loss": 0.0067, "step": 183550 }, { "epoch": 1.98, "learning_rate": 2.3415709930596094e-06, "loss": 0.0064, "step": 183560 }, { "epoch": 1.98, "learning_rate": 2.3253551274567034e-06, "loss": 0.0055, "step": 183570 }, { "epoch": 1.98, "learning_rate": 2.3091392618537974e-06, "loss": 0.0051, "step": 183580 }, { "epoch": 1.98, "learning_rate": 2.2929233962508914e-06, "loss": 0.0059, "step": 183590 }, { "epoch": 1.98, "learning_rate": 2.276707530647986e-06, "loss": 0.0062, "step": 183600 }, { "epoch": 1.98, "learning_rate": 2.26049166504508e-06, "loss": 0.0077, "step": 183610 }, { "epoch": 1.99, "learning_rate": 2.244275799442174e-06, "loss": 0.0061, "step": 183620 }, { "epoch": 1.99, "learning_rate": 2.228059933839268e-06, "loss": 0.0077, "step": 183630 }, { "epoch": 1.99, "learning_rate": 2.2118440682363623e-06, "loss": 0.0089, "step": 183640 }, { "epoch": 1.99, "learning_rate": 2.1956282026334564e-06, "loss": 0.005, "step": 183650 }, { "epoch": 1.99, "learning_rate": 2.179412337030551e-06, "loss": 0.0084, "step": 183660 }, { "epoch": 1.99, "learning_rate": 2.163196471427645e-06, "loss": 0.0051, "step": 183670 }, { "epoch": 1.99, "learning_rate": 2.1469806058247384e-06, "loss": 0.0051, "step": 183680 }, { "epoch": 1.99, "learning_rate": 2.130764740221833e-06, "loss": 0.0047, "step": 183690 }, { "epoch": 1.99, "learning_rate": 2.114548874618927e-06, "loss": 0.0058, "step": 183700 }, { "epoch": 1.99, "learning_rate": 2.0983330090160213e-06, "loss": 0.0066, "step": 183710 }, { "epoch": 1.99, "learning_rate": 2.0821171434131153e-06, "loss": 0.0077, "step": 183720 }, { "epoch": 1.99, "learning_rate": 2.0659012778102093e-06, "loss": 0.0051, "step": 183730 }, { "epoch": 1.99, "learning_rate": 2.0496854122073033e-06, "loss": 0.0077, "step": 183740 }, { "epoch": 1.99, "learning_rate": 2.0334695466043978e-06, "loss": 0.0061, "step": 183750 }, { "epoch": 1.99, "learning_rate": 2.0172536810014918e-06, "loss": 0.0062, "step": 183760 }, { "epoch": 1.99, "learning_rate": 2.001037815398586e-06, "loss": 0.006, "step": 183770 }, { "epoch": 1.99, "learning_rate": 1.98482194979568e-06, "loss": 0.0048, "step": 183780 }, { "epoch": 1.99, "learning_rate": 1.968606084192774e-06, "loss": 0.0076, "step": 183790 }, { "epoch": 1.99, "learning_rate": 1.9523902185898683e-06, "loss": 0.0056, "step": 183800 }, { "epoch": 1.99, "learning_rate": 1.9361743529869623e-06, "loss": 0.0052, "step": 183810 }, { "epoch": 1.99, "learning_rate": 1.9199584873840563e-06, "loss": 0.0065, "step": 183820 }, { "epoch": 1.99, "learning_rate": 1.9037426217811505e-06, "loss": 0.0072, "step": 183830 }, { "epoch": 1.99, "learning_rate": 1.8875267561782447e-06, "loss": 0.0057, "step": 183840 }, { "epoch": 1.99, "learning_rate": 1.8713108905753388e-06, "loss": 0.0057, "step": 183850 }, { "epoch": 1.99, "learning_rate": 1.855095024972433e-06, "loss": 0.0072, "step": 183860 }, { "epoch": 1.99, "learning_rate": 1.838879159369527e-06, "loss": 0.0067, "step": 183870 }, { "epoch": 1.99, "learning_rate": 1.822663293766621e-06, "loss": 0.007, "step": 183880 }, { "epoch": 1.99, "learning_rate": 1.8064474281637152e-06, "loss": 0.0049, "step": 183890 }, { "epoch": 1.99, "learning_rate": 1.7902315625608093e-06, "loss": 0.0055, "step": 183900 }, { "epoch": 1.99, "learning_rate": 1.7740156969579035e-06, "loss": 0.0055, "step": 183910 }, { "epoch": 1.99, "learning_rate": 1.7577998313549975e-06, "loss": 0.0059, "step": 183920 }, { "epoch": 1.99, "learning_rate": 1.7415839657520917e-06, "loss": 0.0055, "step": 183930 }, { "epoch": 1.99, "learning_rate": 1.7253681001491857e-06, "loss": 0.0081, "step": 183940 }, { "epoch": 1.99, "learning_rate": 1.70915223454628e-06, "loss": 0.006, "step": 183950 }, { "epoch": 1.99, "learning_rate": 1.692936368943374e-06, "loss": 0.0067, "step": 183960 }, { "epoch": 1.99, "learning_rate": 1.676720503340468e-06, "loss": 0.0071, "step": 183970 }, { "epoch": 1.99, "learning_rate": 1.6605046377375624e-06, "loss": 0.005, "step": 183980 }, { "epoch": 1.99, "learning_rate": 1.6442887721346562e-06, "loss": 0.0063, "step": 183990 }, { "epoch": 1.99, "learning_rate": 1.6280729065317507e-06, "loss": 0.0053, "step": 184000 }, { "epoch": 1.99, "eval_cer": 0.9215069566410776, "eval_loss": 0.0051878588274121284, "eval_runtime": 121.2445, "eval_samples_per_second": 16.496, "eval_steps_per_second": 4.124, "step": 184000 }, { "epoch": 1.99, "learning_rate": 1.6118570409288447e-06, "loss": 0.0054, "step": 184010 }, { "epoch": 1.99, "learning_rate": 1.595641175325939e-06, "loss": 0.0059, "step": 184020 }, { "epoch": 1.99, "learning_rate": 1.579425309723033e-06, "loss": 0.0077, "step": 184030 }, { "epoch": 1.99, "learning_rate": 1.5632094441201271e-06, "loss": 0.0083, "step": 184040 }, { "epoch": 1.99, "learning_rate": 1.5469935785172212e-06, "loss": 0.0075, "step": 184050 }, { "epoch": 1.99, "learning_rate": 1.5307777129143152e-06, "loss": 0.0062, "step": 184060 }, { "epoch": 1.99, "learning_rate": 1.5145618473114094e-06, "loss": 0.0052, "step": 184070 }, { "epoch": 1.99, "learning_rate": 1.4983459817085034e-06, "loss": 0.0049, "step": 184080 }, { "epoch": 1.99, "learning_rate": 1.4821301161055976e-06, "loss": 0.0053, "step": 184090 }, { "epoch": 1.99, "learning_rate": 1.4659142505026916e-06, "loss": 0.0052, "step": 184100 }, { "epoch": 1.99, "learning_rate": 1.4496983848997859e-06, "loss": 0.0056, "step": 184110 }, { "epoch": 1.99, "learning_rate": 1.4334825192968799e-06, "loss": 0.008, "step": 184120 }, { "epoch": 1.99, "learning_rate": 1.4172666536939741e-06, "loss": 0.0047, "step": 184130 }, { "epoch": 1.99, "learning_rate": 1.4010507880910681e-06, "loss": 0.0043, "step": 184140 }, { "epoch": 1.99, "learning_rate": 1.3848349224881621e-06, "loss": 0.0061, "step": 184150 }, { "epoch": 1.99, "learning_rate": 1.3686190568852564e-06, "loss": 0.0055, "step": 184160 }, { "epoch": 1.99, "learning_rate": 1.3524031912823504e-06, "loss": 0.005, "step": 184170 }, { "epoch": 1.99, "learning_rate": 1.3361873256794448e-06, "loss": 0.0061, "step": 184180 }, { "epoch": 1.99, "learning_rate": 1.3199714600765386e-06, "loss": 0.0069, "step": 184190 }, { "epoch": 1.99, "learning_rate": 1.303755594473633e-06, "loss": 0.0056, "step": 184200 }, { "epoch": 1.99, "learning_rate": 1.287539728870727e-06, "loss": 0.007, "step": 184210 }, { "epoch": 1.99, "learning_rate": 1.2713238632678213e-06, "loss": 0.0057, "step": 184220 }, { "epoch": 1.99, "learning_rate": 1.2551079976649153e-06, "loss": 0.0072, "step": 184230 }, { "epoch": 1.99, "learning_rate": 1.2388921320620093e-06, "loss": 0.0076, "step": 184240 }, { "epoch": 1.99, "learning_rate": 1.2226762664591036e-06, "loss": 0.0051, "step": 184250 }, { "epoch": 1.99, "learning_rate": 1.2064604008561976e-06, "loss": 0.0068, "step": 184260 }, { "epoch": 1.99, "learning_rate": 1.1902445352532918e-06, "loss": 0.0053, "step": 184270 }, { "epoch": 1.99, "learning_rate": 1.1740286696503858e-06, "loss": 0.0054, "step": 184280 }, { "epoch": 1.99, "learning_rate": 1.1578128040474798e-06, "loss": 0.008, "step": 184290 }, { "epoch": 1.99, "learning_rate": 1.141596938444574e-06, "loss": 0.0057, "step": 184300 }, { "epoch": 1.99, "learning_rate": 1.1253810728416683e-06, "loss": 0.005, "step": 184310 }, { "epoch": 1.99, "learning_rate": 1.1091652072387623e-06, "loss": 0.0079, "step": 184320 }, { "epoch": 1.99, "learning_rate": 1.0929493416358565e-06, "loss": 0.0051, "step": 184330 }, { "epoch": 1.99, "learning_rate": 1.0767334760329505e-06, "loss": 0.008, "step": 184340 }, { "epoch": 1.99, "learning_rate": 1.0605176104300448e-06, "loss": 0.0047, "step": 184350 }, { "epoch": 1.99, "learning_rate": 1.0443017448271388e-06, "loss": 0.0034, "step": 184360 }, { "epoch": 1.99, "learning_rate": 1.0280858792242328e-06, "loss": 0.004, "step": 184370 }, { "epoch": 1.99, "learning_rate": 1.011870013621327e-06, "loss": 0.0054, "step": 184380 }, { "epoch": 1.99, "learning_rate": 9.95654148018421e-07, "loss": 0.0073, "step": 184390 }, { "epoch": 1.99, "learning_rate": 9.794382824155152e-07, "loss": 0.0067, "step": 184400 }, { "epoch": 1.99, "learning_rate": 9.632224168126095e-07, "loss": 0.0065, "step": 184410 }, { "epoch": 1.99, "learning_rate": 9.470065512097035e-07, "loss": 0.005, "step": 184420 }, { "epoch": 1.99, "learning_rate": 9.307906856067976e-07, "loss": 0.007, "step": 184430 }, { "epoch": 1.99, "learning_rate": 9.145748200038918e-07, "loss": 0.0073, "step": 184440 }, { "epoch": 1.99, "learning_rate": 8.98358954400986e-07, "loss": 0.006, "step": 184450 }, { "epoch": 1.99, "learning_rate": 8.8214308879808e-07, "loss": 0.0045, "step": 184460 }, { "epoch": 1.99, "learning_rate": 8.659272231951741e-07, "loss": 0.0058, "step": 184470 }, { "epoch": 1.99, "learning_rate": 8.497113575922682e-07, "loss": 0.0065, "step": 184480 }, { "epoch": 1.99, "learning_rate": 8.334954919893623e-07, "loss": 0.0054, "step": 184490 }, { "epoch": 1.99, "learning_rate": 8.172796263864564e-07, "loss": 0.0053, "step": 184500 }, { "epoch": 1.99, "learning_rate": 8.010637607835506e-07, "loss": 0.0052, "step": 184510 }, { "epoch": 1.99, "learning_rate": 7.848478951806447e-07, "loss": 0.0057, "step": 184520 }, { "epoch": 1.99, "learning_rate": 7.686320295777388e-07, "loss": 0.0077, "step": 184530 }, { "epoch": 1.99, "learning_rate": 7.524161639748329e-07, "loss": 0.0056, "step": 184540 }, { "epoch": 2.0, "learning_rate": 7.362002983719269e-07, "loss": 0.0061, "step": 184550 }, { "epoch": 2.0, "learning_rate": 7.199844327690211e-07, "loss": 0.0067, "step": 184560 }, { "epoch": 2.0, "learning_rate": 7.037685671661153e-07, "loss": 0.0073, "step": 184570 }, { "epoch": 2.0, "learning_rate": 6.875527015632094e-07, "loss": 0.0061, "step": 184580 }, { "epoch": 2.0, "learning_rate": 6.713368359603035e-07, "loss": 0.0072, "step": 184590 }, { "epoch": 2.0, "learning_rate": 6.551209703573976e-07, "loss": 0.0053, "step": 184600 }, { "epoch": 2.0, "learning_rate": 6.389051047544918e-07, "loss": 0.0105, "step": 184610 }, { "epoch": 2.0, "learning_rate": 6.226892391515859e-07, "loss": 0.007, "step": 184620 }, { "epoch": 2.0, "learning_rate": 6.0647337354868e-07, "loss": 0.0056, "step": 184630 }, { "epoch": 2.0, "learning_rate": 5.90257507945774e-07, "loss": 0.0056, "step": 184640 }, { "epoch": 2.0, "learning_rate": 5.740416423428682e-07, "loss": 0.006, "step": 184650 }, { "epoch": 2.0, "learning_rate": 5.578257767399623e-07, "loss": 0.0059, "step": 184660 }, { "epoch": 2.0, "learning_rate": 5.416099111370565e-07, "loss": 0.005, "step": 184670 }, { "epoch": 2.0, "learning_rate": 5.253940455341506e-07, "loss": 0.0053, "step": 184680 }, { "epoch": 2.0, "learning_rate": 5.091781799312447e-07, "loss": 0.0058, "step": 184690 }, { "epoch": 2.0, "learning_rate": 4.929623143283388e-07, "loss": 0.0059, "step": 184700 }, { "epoch": 2.0, "learning_rate": 4.767464487254329e-07, "loss": 0.0051, "step": 184710 }, { "epoch": 2.0, "learning_rate": 4.6053058312252703e-07, "loss": 0.0037, "step": 184720 }, { "epoch": 2.0, "learning_rate": 4.4431471751962115e-07, "loss": 0.0066, "step": 184730 }, { "epoch": 2.0, "learning_rate": 4.280988519167153e-07, "loss": 0.0069, "step": 184740 }, { "epoch": 2.0, "learning_rate": 4.118829863138094e-07, "loss": 0.006, "step": 184750 }, { "epoch": 2.0, "learning_rate": 3.956671207109035e-07, "loss": 0.0049, "step": 184760 }, { "epoch": 2.0, "learning_rate": 3.7945125510799763e-07, "loss": 0.0068, "step": 184770 }, { "epoch": 2.0, "learning_rate": 3.6323538950509175e-07, "loss": 0.0065, "step": 184780 }, { "epoch": 2.0, "learning_rate": 3.470195239021859e-07, "loss": 0.0064, "step": 184790 }, { "epoch": 2.0, "learning_rate": 3.3080365829928e-07, "loss": 0.0065, "step": 184800 }, { "epoch": 2.0, "learning_rate": 3.145877926963741e-07, "loss": 0.0082, "step": 184810 }, { "epoch": 2.0, "learning_rate": 2.983719270934682e-07, "loss": 0.0052, "step": 184820 }, { "epoch": 2.0, "learning_rate": 2.8215606149056235e-07, "loss": 0.0047, "step": 184830 }, { "epoch": 2.0, "learning_rate": 2.6594019588765647e-07, "loss": 0.008, "step": 184840 }, { "epoch": 2.0, "learning_rate": 2.497243302847506e-07, "loss": 0.006, "step": 184850 }, { "epoch": 2.0, "learning_rate": 2.335084646818447e-07, "loss": 0.0063, "step": 184860 }, { "epoch": 2.0, "learning_rate": 2.1729259907893883e-07, "loss": 0.0061, "step": 184870 }, { "epoch": 2.0, "learning_rate": 2.0107673347603292e-07, "loss": 0.0079, "step": 184880 }, { "epoch": 2.0, "learning_rate": 1.8486086787312707e-07, "loss": 0.0053, "step": 184890 }, { "epoch": 2.0, "learning_rate": 1.6864500227022116e-07, "loss": 0.0054, "step": 184900 }, { "epoch": 2.0, "learning_rate": 1.524291366673153e-07, "loss": 0.0083, "step": 184910 }, { "epoch": 2.0, "learning_rate": 1.3621327106440942e-07, "loss": 0.0056, "step": 184920 }, { "epoch": 2.0, "learning_rate": 1.1999740546150352e-07, "loss": 0.0057, "step": 184930 }, { "epoch": 2.0, "learning_rate": 1.0378153985859765e-07, "loss": 0.0058, "step": 184940 }, { "epoch": 2.0, "learning_rate": 8.756567425569176e-08, "loss": 0.0056, "step": 184950 }, { "epoch": 2.0, "learning_rate": 7.134980865278588e-08, "loss": 0.006, "step": 184960 }, { "epoch": 2.0, "learning_rate": 5.513394304988e-08, "loss": 0.0064, "step": 184970 }, { "epoch": 2.0, "learning_rate": 3.891807744697412e-08, "loss": 0.0057, "step": 184980 }, { "epoch": 2.0, "learning_rate": 2.2702211844068234e-08, "loss": 0.0055, "step": 184990 }, { "epoch": 2.0, "learning_rate": 6.486346241162353e-09, "loss": 0.0066, "step": 185000 }, { "epoch": 2.0, "eval_cer": 0.9215104310529031, "eval_loss": 0.005186900030821562, "eval_runtime": 121.1763, "eval_samples_per_second": 16.505, "eval_steps_per_second": 4.126, "step": 185000 }, { "epoch": 2.0, "step": 185004, "total_flos": 9.988292384850125e+17, "train_loss": 0.016045775709704408, "train_runtime": 206173.8627, "train_samples_per_second": 28.714, "train_steps_per_second": 0.897 } ], "max_steps": 185004, "num_train_epochs": 2, "total_flos": 9.988292384850125e+17, "trial_name": null, "trial_params": null }